diff --git b/BeNePar/DataPreparation.ipynb a/BeNePar/DataPreparation.ipynb
new file mode 100644
index 0000000..cd2148f
--- /dev/null
+++ a/BeNePar/DataPreparation.ipynb
@@ -0,0 +1,175 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "5cd26f6f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "\n",
+    "from datasets import load_dataset\n",
+    "\n",
+    "from IPython.display import display\n",
+    "\n",
+    "import sys\n",
+    "sys.path.append('../')\n",
+    "from neural_parser import hybrid_tree_utils"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "fecef4af",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Found cached dataset pdb_c_beta (/home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1)\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "d6fc0deda216433982f304d7451158b2",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  0%|          | 0/3 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "pdbc_dataset = load_dataset('../pdb_c_beta/')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "23da801f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "BRACKETS_DIR = 'brackets'  # output directory, recreated from scratch on every run\n",
+    "! rm -rf {BRACKETS_DIR}\n",
+    "! mkdir -p {BRACKETS_DIR}"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "c105feff",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "train\n",
+      "    brackets/pdbc-cont-train.dat\n",
+      "        15903\n",
+      "validation\n",
+      "    brackets/pdbc-cont-validation.dat\n",
+      "        1980\n",
+      "test\n",
+      "    brackets/pdbc-cont-test.dat\n",
+      "        1990\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Write the continuous trees of each split to BRACKETS_DIR, one '(TOP ...)' bracketing per line.\n",
+    "features = pdbc_dataset['train'].features\n",
+    "for part, dataset in pdbc_dataset.items():\n",
+    "    print(part)\n",
+    "    b_cont = []\n",
+    "    for sentence in dataset:\n",
+    "        tree = hybrid_tree_utils.tree_from_dataset_instance(sentence, features)\n",
+    "        if tree.is_continuous():  # only trees passing this check are exported\n",
+    "            b_cont.append(f'(TOP {tree.to_brackets(morph_tags=True)})')\n",
+    "    filepath = os.path.join(BRACKETS_DIR, f'pdbc-cont-{part}.dat')\n",
+    "    with open(filepath, 'w', encoding='utf-8') as f:  # explicit UTF-8: tokens are non-ASCII (Polish) text\n",
+    "        print('   ', filepath)\n",
+    "        print('       ', len(b_cont))\n",
+    "        for row in b_cont:\n",
+    "            print(row, file=f)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "c849233c",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "    1990   121784  1024525 brackets/pdbc-cont-test.dat\n",
+      "   15903  1022627  8620535 brackets/pdbc-cont-train.dat\n",
+      "    1980   126288  1065593 brackets/pdbc-cont-validation.dat\n",
+      "   19873  1270699 10710653 total\n"
+     ]
+    }
+   ],
+   "source": [
+    "! wc {BRACKETS_DIR}/*.dat"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "679b9f10",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(TOP (ROOT (*S (S (NP (AdjP (*Adj (adj:sg:nom:f:pos Skośnooka))) (*NP (*N (subst:sg:nom:f dziewczynka)))) (*VP (*V (fin:sg:ter:imperf trzyma))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*N (subst:pl:loc:f rękach)))) (NP (AdjP (*Adj (adj:pl:nom:f:pos drewniane))) (*NP (*N (subst:pl:nom:f pałeczki))))) (Punct (interp ,)) (*Conj (conj a)) (S (PrepNP (*Prep (prep:inst:nwok przed)) (NP (*N (ppron3:sg:inst:f:ter:akc:praep nią)))) (*VP (*V (fin:pl:ter:imperf znajdują))) (Part (part się)) (NP (*NP (*N (subst:pl:nom:n:ncol naczynia))) (AdjP (*Adj (adj:pl:nom:n:pos kuchenne)))))) (Punct (interp .))))\r\n",
+      "(TOP (ROOT (*S (NP (*NP (*N (subst:sg:nom:n:col Dziecko))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (AdjP (*Adj (adj:sg:loc:f:pos różowej))) (*NP (*N (subst:sg:loc:f opasce)))))) (*VP (*V (fin:sg:ter:imperf unosi))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*N (subst:pl:loc:f rękach)))) (NP (AdjP (*Adj (adj:pl:acc:m3:pos drewniane))) (*NP (*N (subst:pl:acc:m3 patyczki)))) (PrepNP (*Prep (prep:inst:nwok nad)) (NP (AdjP (*AdjP (*Adj (ppas:pl:inst:n:perf:aff postawionymi))) (NP (PrepNP (*Prep (prep:gen do)) (NP (*N (subst:sg:gen:f góry)))) (*NP (*N (subst:sg:inst:n:ncol dnem))))) (*NP (NP (*N (subst:sg:inst:f miską))) (*Conj (conj i)) (NP (*N (subst:sg:inst:m3 garnkiem))))))) (Punct (interp .))))\r\n",
+      "(TOP (ROOT (*S (NP (*NP (*N (subst:pl:nom:m1 Zawodnicy))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*NP (*N (subst:sg:loc:n:ncol pobliżu))) (NP (*N (subst:sg:gen:f piłki)))))) (*VP (*V (fin:pl:ter:imperf przepychają))) (Part (part się)) (PrepNP (*Prep (prep:inst między)) (NP (*N (siebie:inst sobą)))) (PrepNP (*Prep (prep:loc na)) (NP (*N (subst:sg:loc:n:ncol boisku))))) (Punct (interp .))))\r\n",
+      "(TOP (ROOT (*S (S (NP (*NP (*N (subst:sg:nom:f Dziewczynka))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*N (subst:sg:loc:f sukience))))) (*VP (*V (fin:sg:ter:imperf puszcza))) (NP (*NP (*N (subst:pl:acc:f bańki))) (AdjP (*Adj (adj:pl:acc:f:pos mydlane)))) (PrepNP (*Prep (prep:loc na)) (NP (*N (subst:sg:loc:f trawie))))) (Punct (interp ,)) (*Conj (conj a)) (S (PrepNP (*Prep (prep:inst za)) (NP (*N (ppron3:sg:inst:f:ter:akc:praep nią)))) (*VP (*V (fin:sg:ter:imperf stoi))) (NP (AdjP (*Adj (adj:sg:nom:f:pos druga))) (*NP (*N (subst:sg:nom:f dziewczynka)))))) (Punct (interp .))))\r\n",
+      "(TOP (ROOT (*S (NP (*NP (*N (subst:pl:nom:f Dziewczynki))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (AdjP (*Adj (adj:pl:loc:f:pos kolorowych))) (*NP (*N (subst:pl:loc:f sukienkach)))))) (*VP (*V (fin:pl:ter:imperf stoją))) (PrepNP (*Prep (prep:loc na)) (NP (*N (subst:sg:loc:f trawie)))) (VP (Punct (interp ,)) (*VP (*V (pcon:imperf puszczając))) (NP (*NP (*N (subst:pl:acc:f bańki))) (AdjP (*Adj (adj:pl:acc:f:pos mydlane)))))) (Punct (interp .))))\r\n",
+      "(TOP (ROOT (*S (NP (*NP (*N (subst:sg:nom:f Grupa))) (NP (*N (subst:pl:gen:n:col dzieci)))) (*VP (*V (fin:sg:ter:imperf moczy))) (Part (part się)) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*NP (*N (subst:sg:loc:f wodzie))) (PrepNP (*Prep (prep:gen:nwok z)) (NP (*N (subst:sg:gen:f fontanny))))))) (Punct (interp .))))\r\n",
+      "(TOP (ROOT (*S (NP (*NumP (*Num (num:pl:nom:m1:rec:ncol Kilku))) (NP (*N (subst:pl:gen:m1 chłopców)))) (*VP (*V (fin:sg:ter:imperf kąpie))) (Part (part się)) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*NP (*N (subst:sg:loc:f fontannie))) (PrepNP (*Prep (prep:gen obok)) (NP (*NP (*N (subst:pl:gen:m3 stolików))) (CP (Punct (interp ,)) (*S (PrepAdjP (*Prep (prep:loc przy)) (AdjP (*Adj (adj:pl:loc:m3:pos których)))) (*VP (*V (fin:pl:ter:imperf siedzą))) (NP (*N (subst:pl:nom:m1 ludzie)))))))))) (Punct (interp .))))\r\n",
+      "(TOP (ROOT (*S (NP (*NP (*N (subst:sg:nom:f Dwójka))) (NP (AdjP (*Adj (adj:pl:gen:n:pos nagich))) (*NP (*N (subst:pl:gen:n:col dzieci))) (AdjP (*AdjP (*Adj (ppas:pl:gen:n:perf:aff ubrudzonych))) (NP (*N (subst:pl:inst:f farbkami)))))) (*VP (*V (fin:sg:ter:imperf siedzi))) (PrepNP (*Prep (prep:loc na)) (NP (*N (subst:sg:loc:f podłodze)))) (PrepNP (*Prep (prep:gen obok)) (NP (AdjP (*Adj (adj:pl:gen:f:pos porozrzucanych))) (*NP (*N (subst:pl:gen:f kartek)))))) (Punct (interp .))))\r\n",
+      "(TOP (ROOT (*S (S (NP (*NumP (*Num (num:pl:nom:n:rec:col Dwoje))) (NP (AdjP (AdjP (*Adj (adj:pl:gen:n:pos nagich))) (*Conj (interp ,)) (AdjP (*Adj (adj:pl:gen:n:pos małych)))) (*NP (*N (subst:pl:gen:n:col dzieci))))) (*VP (*V (fin:sg:ter:imperf siedzi))) (PrepNP (*Prep (prep:gen naprzeciwko)) (NP (*N (siebie:gen siebie))))) (*Conj (conj i)) (S (NP (AdjP (*Adj (adj:sg:nom:n:com większe))) (*NP (*N (subst:sg:nom:n:col dziecko)))) (*VP (*V (fin:sg:ter:imperf smaruje))) (NP (*N (subst:sg:inst:f farbą))) (NP (AdjP (*Adj (adj:sg:acc:n:com mniejsze))) (*NP (*N (subst:sg:acc:n:col dziecko)))))) (Punct (interp .))))\r\n",
+      "(TOP (ROOT (*S (NP (*NP (*N (subst:sg:nom:f Dziewczynka))) (PrepNP (*Prep (prep:loc o)) (NP (AdjP (*Adj (adj:pl:loc:n:pos ciemnych))) (*NP (*N (subst:pl:loc:n:col oczach)))))) (*VP (*V (fin:sg:ter:imperf patrzy))) (PrepNP (*Prep (prep:acc na)) (NP (AdjP (*Adj (adj:sg:acc:m3:pos czarny))) (*NP (*N (subst:sg:acc:m3 przedmiot))) (CP (Punct (interp ,)) (*S (AdjP (*Adj (adj:sg:acc:m3:pos który))) (*VP (*V (fin:sg:ter:imperf trzyma))) (PrepNP (*Prep (prep:loc:nwok w)) (NP (*N (subst:sg:loc:f ręce))))))))) (Punct (interp .))))\r\n"
+     ]
+    }
+   ],
+   "source": [
+    "! head {BRACKETS_DIR}/pdbc-cont-train.dat"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "TF_zajecia",
+   "language": "python",
+   "name": "tf_zajecia"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.6"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git b/BeNePar/TrainAndParse.ipynb a/BeNePar/TrainAndParse.ipynb
new file mode 100644
index 0000000..34a3065
--- /dev/null
+++ a/BeNePar/TrainAndParse.ipynb
@@ -0,0 +1,973 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "d8404675",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "#BENEPAR = '/home/kkrasnowska/benepar_experiments/self-attentive-parser/src/main.py'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "88603098",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "#! mkdir models"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "d5aedb53",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "#! python {BENEPAR} train \\\n",
+    "#    --train-path brackets/pdbc-cont-train.dat \\\n",
+    "#    --dev-path brackets/pdbc-cont-validation.dat \\\n",
+    "#    --evalb-dir /home/kkrasnowska/benepar_experiments/self-attentive-parser/EVALB_SPMRL \\\n",
+    "#    --use-pretrained --pretrained-model \"allegro/herbert-large-cased\" \\\n",
+    "#    --use-encoder --num-layers 2 \\\n",
+    "#    --predict-tags \\\n",
+    "#    --model-path-base models"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "3f6aaf27",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from IPython.display import display, HTML"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "8d9d5103",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import benepar\n",
+    "import nltk\n",
+    "import spacy"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "c56eda57",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Some weights of the model checkpoint at allegro/herbert-large-cased were not used when initializing BertModel: ['cls.predictions.transform.LayerNorm.bias', 'cls.sso.sso_relationship.weight', 'cls.predictions.transform.dense.weight', 'cls.sso.sso_relationship.bias', 'cls.predictions.bias', 'cls.predictions.decoder.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.decoder.bias']\n",
+      "- This IS expected if you are initializing BertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n",
+      "- This IS NOT expected if you are initializing BertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n"
+     ]
+    }
+   ],
+   "source": [
+    "MODEL = 'models_dev=97.36.pt'\n",
+    "parser = benepar.Parser(MODEL)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "35ffd9af",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "id": "06ae821c",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def postprocess(tree):\n",
+    "    \"\"\"Restore brackets in place (labels: LPAR/RPAR -> ( ), leaves: -LSB-/-RSB- -> [ ]); return tree.\"\"\"\n",
+    "    for node in tree.subtrees():\n",
+    "        node.set_label(node.label().replace('LPAR', '(').replace('RPAR', ')'))\n",
+    "        for i, child in enumerate(node):\n",
+    "            if isinstance(child, str):  # leaf tokens are plain strings; subtrees are visited on their own\n",
+    "                node[i] = child.replace('-LSB-', '[').replace('-RSB-', ']')\n",
+    "    return tree\n",
+    "\n",
+    "def parse_tokenized_sentences(sentences, parser):\n",
+    "    \"\"\"Parse sentences given as token lists with parser; return the postprocessed trees as a list.\"\"\"\n",
+    "    inputs = [benepar.InputSentence(words=tokens) for tokens in sentences]\n",
+    "    return [postprocess(tree) for tree in parser.parse_sents(inputs)]\n",
+    "\n",
+    "def parse_sentence(sentence, parser):\n",
+    "    \"\"\"Split sentence on whitespace, parse it with parser and return its postprocessed tree.\"\"\"\n",
+    "    return parse_tokenized_sentences([sentence.split()], parser)[0]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "id": "c96dc9d9",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "You're using a HerbertTokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.\n",
+      "/home/kkrasnowska/venvs/torch_benepar/lib/python3.10/site-packages/torch/distributions/distribution.py:44: UserWarning: <class 'torch_struct.distributions.TreeCRF'> does not define `arg_constraints`. Please set `arg_constraints = {}` or initialize the distribution with `validate_args=False` to turn off validation.\n",
+      "  warnings.warn(f'{self.__class__} does not define `arg_constraints`. ' +\n"
+     ]
+    },
+    {
+     "data": {
+      "image/svg+xml": [
+       "<svg baseProfile=\"full\" height=\"312px\" preserveAspectRatio=\"xMidYMid meet\" style=\"font-family: times, serif; font-weight:normal; font-style: normal; font-size: 16px;\" version=\"1.1\" viewBox=\"0,0,512.0,312.0\" width=\"512px\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:ev=\"http://www.w3.org/2001/xml-events\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">TOP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ROOT</text></svg><svg width=\"12.5%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">[</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"6.25%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"75%\" x=\"12.5%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*S</text></svg><svg width=\"35.4167%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">subst:pl:nom:m2</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Koty</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"17.7083%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"12.5%\" x=\"35.4167%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">pred</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">to</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"41.6667%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"35.4167%\" x=\"47.9167%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:pl:nom:m1</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs 
/><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">złodzieje</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"65.625%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"16.6667%\" x=\"83.3333%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">.</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"91.6667%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"12.5%\" x=\"87.5%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">]</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"93.75%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" 
y1=\"1.2em\" y2=\"3em\" /></svg>"
+      ],
+      "text/plain": [
+       "Tree('TOP', [Tree('ROOT', [Tree('Punct', [Tree('interp', ['['])]), Tree('*S', [Tree('NP', [Tree('*N', [Tree('subst:pl:nom:m2', ['Koty'])])]), Tree('*VP', [Tree('*V', [Tree('pred', ['to'])])]), Tree('NP', [Tree('*N', [Tree('subst:pl:nom:m1', ['złodzieje'])])]), Tree('Punct', [Tree('interp', ['.'])])]), Tree('Punct', [Tree('interp', [']'])])])])"
+      ]
+     },
+     "execution_count": 12,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "parse_sentence('[ Koty to złodzieje . ]', parser)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "id": "d62d1e31",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "image/svg+xml": [
+       "<svg baseProfile=\"full\" height=\"312px\" preserveAspectRatio=\"xMidYMid meet\" style=\"font-family: times, serif; font-weight:normal; font-style: normal; font-size: 16px;\" version=\"1.1\" viewBox=\"0,0,560.0,312.0\" width=\"560px\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:ev=\"http://www.w3.org/2001/xml-events\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">TOP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ROOT</text></svg><svg width=\"88.5714%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*S</text></svg><svg width=\"72.5806%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"44.4444%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">praet:sg:m1:imperf</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Widział</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"22.2222%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"55.5556%\" x=\"44.4444%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">aglt:sg:pri:imperf:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">am</text></svg></svg><line 
stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"72.2222%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"36.2903%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"27.4194%\" x=\"72.5806%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:acc:m2</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">kotka</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"86.2903%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"44.2857%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"11.4286%\" x=\"88.5714%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">.</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" 
/></svg><line stroke=\"black\" x1=\"50%\" x2=\"94.2857%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg>"
+      ],
+      "text/plain": [
+       "Tree('TOP', [Tree('ROOT', [Tree('*S', [Tree('*VP', [Tree('*V', [Tree('praet:sg:m1:imperf', ['Widział']), Tree('aglt:sg:pri:imperf:nwok', ['am'])])]), Tree('NP', [Tree('*N', [Tree('subst:sg:acc:m2', ['kotka'])])])]), Tree('Punct', [Tree('interp', ['.'])])])])"
+      ]
+     },
+     "execution_count": 13,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "parse_sentence('Widział am kotka .', parser)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "id": "418db531",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "with open('brackets/pdbc-cont-validation.dat', encoding='utf-8') as f:  # one bracketed tree per line\n",
+    "    val_trees = [postprocess(nltk.Tree.fromstring(line.strip('\\n'))) for line in f]\n",
+    "with open('brackets/pdbc-cont-test.dat', encoding='utf-8') as f:\n",
+    "    test_trees = [postprocess(nltk.Tree.fromstring(line.strip('\\n'))) for line in f]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "id": "2e5f4739",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "val_sentences = [gold.leaves() for gold in val_trees]  # token lists read off the loaded trees\n",
+    "test_sentences = [gold.leaves() for gold in test_trees]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 16,
+   "id": "6c52ef3f",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/home/kkrasnowska/venvs/torch_benepar/lib/python3.10/site-packages/torch/distributions/distribution.py:44: UserWarning: <class 'torch_struct.distributions.TreeCRF'> does not define `arg_constraints`. Please set `arg_constraints = {}` or initialize the distribution with `validate_args=False` to turn off validation.\n",
+      "  warnings.warn(f'{self.__class__} does not define `arg_constraints`. ' +\n"
+     ]
+    }
+   ],
+   "source": [
+    "val_pred_trees = parse_tokenized_sentences(val_sentences, parser)\n",
+    "test_pred_trees = parse_tokenized_sentences(test_sentences, parser)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 17,
+   "id": "d6d45ba8",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "assert len(val_trees) == len(val_pred_trees)  # loaded and predicted trees must pair up one-to-one\n",
+    "assert len(test_trees) == len(test_pred_trees)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 18,
+   "id": "399c3f08",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Strip the TOP wrapper: replace each tree by the first child of its root node.\n",
+    "val_trees = [top[0] for top in val_trees]\n",
+    "test_trees = [top[0] for top in test_trees]\n",
+    "val_pred_trees = [top[0] for top in val_pred_trees]\n",
+    "test_pred_trees = [top[0] for top in test_pred_trees]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 19,
+   "id": "827be810",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "image/svg+xml": [
+       "<svg baseProfile=\"full\" height=\"504px\" preserveAspectRatio=\"xMidYMid meet\" style=\"font-family: times, serif; font-weight:normal; font-style: normal; font-size: 16px;\" version=\"1.1\" viewBox=\"0,0,2808.0,504.0\" width=\"2808px\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:ev=\"http://www.w3.org/2001/xml-events\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ROOT</text></svg><svg width=\"97.7208%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*S</text></svg><svg width=\"41.691%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">S</text></svg><svg width=\"22.3776%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"46.875%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:loc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">W</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.4375%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"53.125%\" x=\"46.875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:loc:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">samolocie</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"73.4375%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"11.1888%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"13.986%\" x=\"22.3776%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">praet:sg:m1:imperf</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">czytał</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"29.3706%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"63.6364%\" x=\"36.3636%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"18.6813%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text 
text-anchor=\"middle\" x=\"50%\" y=\"1em\">*NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:pl:acc:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">wycinki</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"9.34066%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"81.3187%\" x=\"18.6813%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"20.2703%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:gen:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">z</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"10.1351%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"79.7297%\" x=\"20.2703%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"27.1186%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" 
x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:gen:f</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prasy</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"13.5593%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"72.8814%\" x=\"27.1186%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"41.8605%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:gen:f:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">polskiej</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" 
x2=\"20.9302%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"16.2791%\" x=\"41.8605%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">i</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"41.8605%\" x=\"58.1395%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:gen:f:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">polonijnej</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"79.0698%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"63.5593%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"60.1351%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"59.3407%\" y1=\"1.2em\" y2=\"3em\" /></svg><line 
stroke=\"black\" x1=\"50%\" x2=\"68.1818%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"20.8455%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"2.33236%\" x=\"41.691%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">-</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"42.8571%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"55.9767%\" x=\"44.0233%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">S</text></svg><svg width=\"17.7083%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepAdjP</text></svg><svg width=\"44.1176%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:loc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">w</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"22.0588%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"55.8824%\" x=\"44.1176%\" y=\"3em\"><defs /><svg 
width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:loc:m3:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">każdym</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"72.0588%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"8.85417%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"6.77083%\" x=\"17.7083%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">imps:imperf</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">piętnowano</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"21.0938%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"17.7083%\" 
x=\"24.4792%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ppron3:sg:acc:m1:ter:nakc:npraep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">go</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"33.3333%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"57.8125%\" x=\"42.1875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Compar</text></svg><svg width=\"6.30631%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Comp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">comp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">jako</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"3.15315%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"93.6937%\" x=\"6.30631%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">AdjP</text></svg><svg width=\"7.69231%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">\"</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"3.84615%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"30.7692%\" x=\"7.69231%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"46.875%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:gen:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">bez</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.4375%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"53.125%\" x=\"46.875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" 
y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:gen:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">umiaru</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"73.4375%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.0769%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"24.0385%\" x=\"38.4615%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ppas:sg:acc:m1:perf:aff</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">zapatrzonego</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50.4808%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"29.8077%\" x=\"62.5%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"48.3871%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:acc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">w</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"24.1935%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"51.6129%\" x=\"48.3871%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:acc:f</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Moskwę</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"74.1935%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"77.4038%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"7.69231%\" x=\"92.3077%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" 
y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">\"</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"96.1538%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"53.1532%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"71.0938%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"72.0117%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"48.8604%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"2.2792%\" x=\"97.7208%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">.</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"98.8604%\" y1=\"1.2em\" y2=\"3em\" /></svg>"
+      ],
+      "text/plain": [
+       "Tree('ROOT', [Tree('*S', [Tree('S', [Tree('PrepNP', [Tree('*Prep', [Tree('prep:loc:nwok', ['W'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:loc:m3', ['samolocie'])])])]), Tree('*VP', [Tree('*V', [Tree('praet:sg:m1:imperf', ['czytał'])])]), Tree('NP', [Tree('*NP', [Tree('*N', [Tree('subst:pl:acc:m3', ['wycinki'])])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:gen:nwok', ['z'])]), Tree('NP', [Tree('*NP', [Tree('*N', [Tree('subst:sg:gen:f', ['prasy'])])]), Tree('AdjP', [Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:gen:f:pos', ['polskiej'])])]), Tree('*Conj', [Tree('conj', ['i'])]), Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:gen:f:pos', ['polonijnej'])])])])])])])]), Tree('*Conj', [Tree('interp', ['-'])]), Tree('S', [Tree('PrepAdjP', [Tree('*Prep', [Tree('prep:loc:nwok', ['w'])]), Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:loc:m3:pos', ['każdym'])])])]), Tree('*VP', [Tree('*V', [Tree('imps:imperf', ['piętnowano'])])]), Tree('NP', [Tree('*N', [Tree('ppron3:sg:acc:m1:ter:nakc:npraep', ['go'])])]), Tree('Compar', [Tree('*Comp', [Tree('comp', ['jako'])]), Tree('AdjP', [Tree('Punct', [Tree('interp', ['\"'])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:gen:nwok', ['bez'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:gen:m3', ['umiaru'])])])]), Tree('*AdjP', [Tree('*Adj', [Tree('ppas:sg:acc:m1:perf:aff', ['zapatrzonego'])])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:acc:nwok', ['w'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:acc:f', ['Moskwę'])])])]), Tree('Punct', [Tree('interp', ['\"'])])])])])]), Tree('Punct', [Tree('interp', ['.'])])])"
+      ]
+     },
+     "execution_count": 19,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "val_trees[504]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 20,
+   "id": "1059e782",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "image/svg+xml": [
+       "<svg baseProfile=\"full\" height=\"504px\" preserveAspectRatio=\"xMidYMid meet\" style=\"font-family: times, serif; font-weight:normal; font-style: normal; font-size: 16px;\" version=\"1.1\" viewBox=\"0,0,2808.0,504.0\" width=\"2808px\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:ev=\"http://www.w3.org/2001/xml-events\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ROOT</text></svg><svg width=\"97.7208%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*S</text></svg><svg width=\"41.691%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">S</text></svg><svg width=\"22.3776%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"46.875%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:loc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">W</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.4375%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"53.125%\" x=\"46.875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:loc:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">samolocie</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"73.4375%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"11.1888%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"13.986%\" x=\"22.3776%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">praet:sg:m1:imperf</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">czytał</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"29.3706%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"63.6364%\" x=\"36.3636%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"18.6813%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text 
text-anchor=\"middle\" x=\"50%\" y=\"1em\">*NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:pl:acc:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">wycinki</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"9.34066%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"81.3187%\" x=\"18.6813%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"20.2703%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:gen:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">z</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"10.1351%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"79.7297%\" x=\"20.2703%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"27.1186%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" 
x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:gen:f</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prasy</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"13.5593%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"72.8814%\" x=\"27.1186%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"41.8605%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:gen:f:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">polskiej</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" 
x2=\"20.9302%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"16.2791%\" x=\"41.8605%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">i</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"41.8605%\" x=\"58.1395%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:gen:f:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">polonijnej</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"79.0698%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"63.5593%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"60.1351%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"59.3407%\" y1=\"1.2em\" y2=\"3em\" /></svg><line 
stroke=\"black\" x1=\"50%\" x2=\"68.1818%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"20.8455%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"2.33236%\" x=\"41.691%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Conj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">-</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"42.8571%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"55.9767%\" x=\"44.0233%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">S</text></svg><svg width=\"17.7083%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepAdjP</text></svg><svg width=\"44.1176%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:loc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">w</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"22.0588%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"55.8824%\" x=\"44.1176%\" y=\"3em\"><defs /><svg 
width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adj:sg:loc:m3:pos</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">każdym</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"72.0588%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"8.85417%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"6.77083%\" x=\"17.7083%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">imps:imperf</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">piętnowano</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"21.0938%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"17.7083%\" 
x=\"24.4792%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ppron3:sg:acc:m1:ter:nakc:npraep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">go</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"33.3333%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"57.8125%\" x=\"42.1875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Compar</text></svg><svg width=\"6.30631%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Comp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">comp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">jako</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"3.15315%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"93.6937%\" x=\"6.30631%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">AdjP</text></svg><svg width=\"7.69231%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">\"</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"3.84615%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"30.7692%\" x=\"7.69231%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"46.875%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:gen:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">bez</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.4375%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"53.125%\" x=\"46.875%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" 
y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:gen:m3</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">umiaru</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"73.4375%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"23.0769%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"24.0385%\" x=\"38.4615%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*AdjP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Adj</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ppas:sg:acc:m1:perf:aff</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">zapatrzonego</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50.4808%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"29.8077%\" x=\"62.5%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"48.3871%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" 
y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">prep:acc:nwok</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">w</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"24.1935%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"51.6129%\" x=\"48.3871%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">subst:sg:acc:f</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Moskwę</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"74.1935%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"77.4038%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"7.69231%\" x=\"92.3077%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" 
y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">\"</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"96.1538%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"53.1532%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"71.0938%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"72.0117%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"48.8604%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"2.2792%\" x=\"97.7208%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">interp</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">.</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"98.8604%\" y1=\"1.2em\" y2=\"3em\" /></svg>"
+      ],
+      "text/plain": [
+       "Tree('ROOT', [Tree('*S', [Tree('S', [Tree('PrepNP', [Tree('*Prep', [Tree('prep:loc:nwok', ['W'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:loc:m3', ['samolocie'])])])]), Tree('*VP', [Tree('*V', [Tree('praet:sg:m1:imperf', ['czytał'])])]), Tree('NP', [Tree('*NP', [Tree('*N', [Tree('subst:pl:acc:m3', ['wycinki'])])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:gen:nwok', ['z'])]), Tree('NP', [Tree('*NP', [Tree('*N', [Tree('subst:sg:gen:f', ['prasy'])])]), Tree('AdjP', [Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:gen:f:pos', ['polskiej'])])]), Tree('*Conj', [Tree('conj', ['i'])]), Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:gen:f:pos', ['polonijnej'])])])])])])])]), Tree('*Conj', [Tree('interp', ['-'])]), Tree('S', [Tree('PrepAdjP', [Tree('*Prep', [Tree('prep:loc:nwok', ['w'])]), Tree('AdjP', [Tree('*Adj', [Tree('adj:sg:loc:m3:pos', ['każdym'])])])]), Tree('*VP', [Tree('*V', [Tree('imps:imperf', ['piętnowano'])])]), Tree('NP', [Tree('*N', [Tree('ppron3:sg:acc:m1:ter:nakc:npraep', ['go'])])]), Tree('Compar', [Tree('*Comp', [Tree('comp', ['jako'])]), Tree('AdjP', [Tree('Punct', [Tree('interp', ['\"'])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:gen:nwok', ['bez'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:gen:m3', ['umiaru'])])])]), Tree('*AdjP', [Tree('*Adj', [Tree('ppas:sg:acc:m1:perf:aff', ['zapatrzonego'])])]), Tree('PrepNP', [Tree('*Prep', [Tree('prep:acc:nwok', ['w'])]), Tree('NP', [Tree('*N', [Tree('subst:sg:acc:f', ['Moskwę'])])])]), Tree('Punct', [Tree('interp', ['\"'])])])])])]), Tree('Punct', [Tree('interp', ['.'])])])"
+      ]
+     },
+     "execution_count": 20,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "val_pred_trees[504]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 25,
+   "id": "4d6c7096",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "'''\n",
+    "def undummy(_tree):\n",
+    "    tree = _tree.copy(deep=True)\n",
+    "    for node in tree.subtrees():\n",
+    "        for i, child in enumerate(node):\n",
+    "            if type(child) != str and child.label() == 'DUMMY_PRE':\n",
+    "                node[i] = child[0]\n",
+    "    return tree\n",
+    "\n",
+    "'''\n",
+    "def untag(_tree):\n",
+    "    \"\"\"Return a deep copy of ``_tree`` without its string-only subtrees.\n",
+    "\n",
+    "    Every non-string child whose own children are all strings must hold\n",
+    "    exactly one of them (asserted); that child is replaced in its parent\n",
+    "    by the string it holds. ``_tree`` itself is not modified.\n",
+    "    \"\"\"\n",
+    "    tree = _tree.copy(deep=True)\n",
+    "    for node in tree.subtrees():\n",
+    "        for i, child in enumerate(node):\n",
+    "            if isinstance(child, str):\n",
+    "                continue\n",
+    "            if len(child) > 0 and all(isinstance(leaf, str) for leaf in child):\n",
+    "                assert len(child) == 1, child\n",
+    "                node[i] = child[0]\n",
+    "    return tree\n",
+    "\n",
+    "'''\n",
+    "\n",
+    "ZDANIE_HEADS = {'*ff', '*spójnik', '*przec', '*zdanie', '*formawykrz'}\n",
+    "ZDANIE_HEADS2 = set(l.strip('*') for l in ZDANIE_HEADS)\n",
+    "ZDANIE_HEAD_HIERARCHY = ('ff', 'spójnik', 'przec', 'zdanie')\n",
+    "\n",
+    "\n",
+    "def correct(_tree):\n",
+    "    tree = _tree.copy(deep=True)\n",
+    "    for node in tree.subtrees():\n",
+    "        if len(node) == 1 and type(node[0]) != str and node.label() == node[0].label():\n",
+    "            new_children = [child for child in node[0]]\n",
+    "            node.pop()\n",
+    "            node += new_children\n",
+    "    for node in tree.subtrees():\n",
+    "        if 'zdanie' in node.label():\n",
+    "            heads = []\n",
+    "            non_heads = []\n",
+    "            for child in node:\n",
+    "                if child.label().startswith('*') and child.label() not in ZDANIE_HEADS:\n",
+    "                    child.set_label(child.label()[1:])\n",
+    "                (heads if child.label().startswith('*') else non_heads).append(child)\n",
+    "    \n",
+    "    return tree\n",
+    "''';"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 35,
+   "id": "4a26b2e1",
+   "metadata": {
+    "scrolled": false
+   },
+   "outputs": [],
+   "source": [
+    "from collections import Counter, defaultdict\n",
+    "\n",
+    "c = Counter()\n",
+    "\n",
+    "def tree2spans(_tree):\n",
+    "    \"\"\"Describe every subtree of ``_tree`` as a ``(label, children, text)`` tuple.\n",
+    "\n",
+    "    Works on a deep copy in which each string child is rewritten to\n",
+    "    ``'<counter>##<token>'``, the counter growing by one per rewritten\n",
+    "    string in traversal order, so that repeated tokens stay distinct.\n",
+    "    ``children`` holds the label of each subtree child and the rewritten\n",
+    "    text of each string child; ``text`` is the space-joined leaves.\n",
+    "\n",
+    "    Returns the set of these tuples and asserts that no two subtrees\n",
+    "    produced the same tuple.\n",
+    "    \"\"\"\n",
+    "    tree = _tree.copy(deep=True)\n",
+    "    # make tokens unique\n",
+    "    idx = 0\n",
+    "    for node in tree.subtrees():\n",
+    "        for i, child in enumerate(node):\n",
+    "            if isinstance(child, str):\n",
+    "                node[i] = f'{idx}##{child}'\n",
+    "                idx += 1\n",
+    "    spans = [\n",
+    "        (\n",
+    "            node.label(),\n",
+    "            tuple(child if isinstance(child, str) else child.label() for child in node),\n",
+    "            ' '.join(node.leaves()),\n",
+    "        )\n",
+    "        for node in tree.subtrees()\n",
+    "    ]\n",
+    "    unique_spans = set(spans)\n",
+    "    assert len(unique_spans) == len(spans)\n",
+    "    return unique_spans\n",
+    "\n",
+    "def spans2dict(spans):\n",
+    "    \"\"\"Group the labels of ``(label, children, text)`` spans by their text.\n",
+    "\n",
+    "    Returns a ``defaultdict`` mapping each text to the set of labels seen\n",
+    "    for it. When a label shows up again for the same text, a marker line\n",
+    "    is printed and the whole ``spans`` collection is displayed.\n",
+    "    \"\"\"\n",
+    "    labels_by_text = defaultdict(set)\n",
+    "    for label, _children, text in spans:\n",
+    "        seen = labels_by_text[text]\n",
+    "        if label in seen:\n",
+    "            # already recorded for this text: report it, nothing to add\n",
+    "            print('!!!!!!!!!!!!!!!', label, text)\n",
+    "            display(spans)\n",
+    "        else:\n",
+    "            seen.add(label)\n",
+    "    return labels_by_text\n",
+    "\n",
+    "def spans2errors(spans_gold, spans_pred):\n",
+    "    \"\"\"Compare the gold and predicted spans of one sentence.\n",
+    "\n",
+    "    Labels are grouped per covered text with ``spans2dict``. A label found\n",
+    "    for the same text on both sides is a true positive, one found only in\n",
+    "    gold a false negative (reported as ``'-label'``), one found only in the\n",
+    "    prediction a false positive (reported as ``'+label'``).\n",
+    "\n",
+    "    Returns ``((tp, fp, fn), errors)``; ``errors`` lists one\n",
+    "    ``(sorted tuple of error strings, text)`` pair per text that has at\n",
+    "    least one mismatch, ordered by text.\n",
+    "    \"\"\"\n",
+    "    gold_by_text = spans2dict(spans_gold)\n",
+    "    pred_by_text = spans2dict(spans_pred)\n",
+    "    errors = []\n",
+    "    tp, fp, fn = 0, 0, 0\n",
+    "    # sorted() keeps the order of `errors` reproducible between runs\n",
+    "    for text in sorted(set(gold_by_text) | set(pred_by_text)):\n",
+    "        gold, pred = gold_by_text[text], pred_by_text[text]\n",
+    "        missing = gold - pred\n",
+    "        spurious = pred - gold\n",
+    "        tp += len(gold & pred)\n",
+    "        fn += len(missing)\n",
+    "        fp += len(spurious)\n",
+    "        errs = [f'-{label}' for label in missing] + [f'+{label}' for label in spurious]\n",
+    "        if errs:\n",
+    "            errors.append((tuple(sorted(errs)), text))\n",
+    "    return (tp, fp, fn), errors"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 54,
+   "id": "397e3750",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def eval_trees(trees_gold, trees_pred,\n",
+    "               debug_leaves=('Poszedł', 'em', 'do', 'adwokata', '.')):\n",
+    "    \"\"\"Score predicted trees against gold trees, pair by pair.\n",
+    "\n",
+    "    The leaves of both trees of a pair, joined without separators, must be\n",
+    "    equal; otherwise both leaf lists are printed and an AssertionError is\n",
+    "    raised. Each tree then goes through ``untag`` and ``tree2spans`` and\n",
+    "    the two span sets are compared with ``spans2errors``.\n",
+    "\n",
+    "    Args:\n",
+    "        trees_gold: iterable of gold trees.\n",
+    "        trees_pred: iterable of predicted trees, paired with ``trees_gold``\n",
+    "            by ``zip`` (which stops at the shorter of the two).\n",
+    "        debug_leaves: leaves of a sentence whose trees and spans are dumped\n",
+    "            for inspection; ``None`` disables the dump.\n",
+    "\n",
+    "    Returns:\n",
+    "        ``(evaluation, errors)``: ``evaluation`` holds one ``(tp, fp, fn)``\n",
+    "        tuple per pair; ``errors`` holds ``(error, gold_tree, pred_tree)``\n",
+    "        for every error from ``spans2errors``, with the trees as passed in.\n",
+    "    \"\"\"\n",
+    "    watched = None if debug_leaves is None else list(debug_leaves)\n",
+    "    evaluation, errors = [], []\n",
+    "    for idx, (_tree_gold, _tree_pred) in enumerate(zip(trees_gold, trees_pred)):\n",
+    "        if ''.join(_tree_gold.leaves()) != ''.join(_tree_pred.leaves()):\n",
+    "            print(_tree_gold.leaves())\n",
+    "            print(_tree_pred.leaves())\n",
+    "            raise AssertionError(f'leaves of gold and predicted tree {idx} differ')\n",
+    "        tree_gold = untag(_tree_gold)\n",
+    "        tree_pred = untag(_tree_pred)\n",
+    "        spans_gold = tree2spans(tree_gold)\n",
+    "        spans_pred = tree2spans(tree_pred)\n",
+    "        if tree_gold.leaves() == watched:\n",
+    "            display(tree_gold)\n",
+    "            display(tree_pred)\n",
+    "            print(spans_gold)\n",
+    "            print(spans_pred)\n",
+    "        try:\n",
+    "            evl, errs = spans2errors(spans_gold, spans_pred)\n",
+    "        except Exception:\n",
+    "            # show the offending prediction and its position, then re-raise\n",
+    "            display(tree_pred)\n",
+    "            # NOTE(review): display2 is not defined in this part of the\n",
+    "            # notebook - confirm it exists before relying on this output\n",
+    "            display2(_tree_pred)\n",
+    "            print(idx)\n",
+    "            raise\n",
+    "        evaluation.append(evl)\n",
+    "        errors += [(err, _tree_gold, _tree_pred) for err in errs]\n",
+    "    return evaluation, errors"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 55,
+   "id": "5dcd68fd",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "image/svg+xml": [
+       "<svg baseProfile=\"full\" height=\"264px\" preserveAspectRatio=\"xMidYMid meet\" style=\"font-family: times, serif; font-weight:normal; font-style: normal; font-size: 16px;\" version=\"1.1\" viewBox=\"0,0,296.0,264.0\" width=\"296px\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:ev=\"http://www.w3.org/2001/xml-events\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ROOT</text></svg><svg width=\"81.0811%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*S</text></svg><svg width=\"43.3333%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"69.2308%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Poszedł</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"34.6154%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"30.7692%\" x=\"69.2308%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">em</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"84.6154%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"21.6667%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"56.6667%\" x=\"43.3333%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"41.1765%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" 
y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">do</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"20.5882%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"58.8235%\" x=\"41.1765%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adwokata</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"70.5882%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"71.6667%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"40.5405%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"18.9189%\" x=\"81.0811%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">.</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"90.5405%\" y1=\"1.2em\" y2=\"3em\" /></svg>"
+      ],
+      "text/plain": [
+       "Tree('ROOT', [Tree('*S', [Tree('*VP', [Tree('*V', ['Poszedł', 'em'])]), Tree('PrepNP', [Tree('*Prep', ['do']), Tree('NP', [Tree('*N', ['adwokata'])])])]), Tree('Punct', ['.'])])"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "image/svg+xml": [
+       "<svg baseProfile=\"full\" height=\"264px\" preserveAspectRatio=\"xMidYMid meet\" style=\"font-family: times, serif; font-weight:normal; font-style: normal; font-size: 16px;\" version=\"1.1\" viewBox=\"0,0,296.0,264.0\" width=\"296px\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:ev=\"http://www.w3.org/2001/xml-events\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">ROOT</text></svg><svg width=\"81.0811%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*S</text></svg><svg width=\"43.3333%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*VP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*V</text></svg><svg width=\"69.2308%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Poszedł</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"34.6154%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"30.7692%\" x=\"69.2308%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">em</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"84.6154%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"21.6667%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"56.6667%\" x=\"43.3333%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">PrepNP</text></svg><svg width=\"41.1765%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*Prep</text></svg><svg width=\"100%\" x=\"0%\" 
y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">do</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"20.5882%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"58.8235%\" x=\"41.1765%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">NP</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">*N</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">adwokata</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"70.5882%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"71.6667%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"40.5405%\" y1=\"1.2em\" y2=\"3em\" /><svg width=\"18.9189%\" x=\"81.0811%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">Punct</text></svg><svg width=\"100%\" x=\"0%\" y=\"3em\"><defs /><svg width=\"100%\" x=\"0\" y=\"0em\"><defs /><text text-anchor=\"middle\" x=\"50%\" y=\"1em\">.</text></svg></svg><line stroke=\"black\" x1=\"50%\" x2=\"50%\" y1=\"1.2em\" y2=\"3em\" /></svg><line stroke=\"black\" x1=\"50%\" x2=\"90.5405%\" y1=\"1.2em\" y2=\"3em\" /></svg>"
+      ],
+      "text/plain": [
+       "Tree('ROOT', [Tree('*S', [Tree('*VP', [Tree('*V', ['Poszedł', 'em'])]), Tree('PrepNP', [Tree('*Prep', ['do']), Tree('NP', [Tree('*N', ['adwokata'])])])]), Tree('Punct', ['.'])])"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "{('Punct', ('4##.',), '4##.'), ('*Prep', ('2##do',), '2##do'), ('ROOT', ('*S', 'Punct'), '0##Poszedł 1##em 2##do 3##adwokata 4##.'), ('NP', ('*N',), '3##adwokata'), ('*V', ('0##Poszedł', '1##em'), '0##Poszedł 1##em'), ('PrepNP', ('*Prep', 'NP'), '2##do 3##adwokata'), ('*S', ('*VP', 'PrepNP'), '0##Poszedł 1##em 2##do 3##adwokata'), ('*N', ('3##adwokata',), '3##adwokata'), ('*VP', ('*V',), '0##Poszedł 1##em')}\n",
+      "{('Punct', ('4##.',), '4##.'), ('*Prep', ('2##do',), '2##do'), ('ROOT', ('*S', 'Punct'), '0##Poszedł 1##em 2##do 3##adwokata 4##.'), ('NP', ('*N',), '3##adwokata'), ('*V', ('0##Poszedł', '1##em'), '0##Poszedł 1##em'), ('PrepNP', ('*Prep', 'NP'), '2##do 3##adwokata'), ('*S', ('*VP', 'PrepNP'), '0##Poszedł 1##em 2##do 3##adwokata'), ('*N', ('3##adwokata',), '3##adwokata'), ('*VP', ('*V',), '0##Poszedł 1##em')}\n",
+      "!!!!!!!!!!!!!!! *AdvP 0##Trudno\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{('*Adv', ('0##Trudno',), '0##Trudno'),\n",
+       " ('*AdvP', ('*Adv',), '0##Trudno'),\n",
+       " ('*AdvP', ('*AdvP',), '0##Trudno'),\n",
+       " ('Punct', ('1##.',), '1##.'),\n",
+       " ('ROOT', ('*AdvP', 'Punct'), '0##Trudno 1##.')}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "!!!!!!!!!!!!!!! *AdvP 0##Trudno\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{('*Adv', ('0##Trudno',), '0##Trudno'),\n",
+       " ('*AdvP', ('*Adv',), '0##Trudno'),\n",
+       " ('*AdvP', ('*AdvP',), '0##Trudno'),\n",
+       " ('Punct', ('1##.',), '1##.'),\n",
+       " ('ROOT', ('*AdvP', 'Punct'), '0##Trudno 1##.')}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "!!!!!!!!!!!!!!! *PrepNP 0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{('*Comp', ('3##iż',), '3##iż'),\n",
+       " ('*Comp', ('7##iż',), '7##iż'),\n",
+       " ('*Conj', ('6##,',), '6##,'),\n",
+       " ('*N', ('1##tym',), '1##tym'),\n",
+       " ('*N', ('11##nic',), '11##nic'),\n",
+       " ('*N', ('5##nikim',), '5##nikim'),\n",
+       " ('*N', ('9##cię',), '9##cię'),\n",
+       " ('*NP', ('*N',), '1##tym'),\n",
+       " ('*Prep', ('0##O',), '0##O'),\n",
+       " ('*Prep', ('10##za',), '10##za'),\n",
+       " ('*PrepNP',\n",
+       "  ('*Prep', 'NP'),\n",
+       "  '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n",
+       " ('*PrepNP',\n",
+       "  ('*PrepNP',),\n",
+       "  '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n",
+       " ('*V', ('4##jesteś',), '4##jesteś'),\n",
+       " ('*V', ('8##mają',), '8##mają'),\n",
+       " ('*VP', ('*V',), '4##jesteś'),\n",
+       " ('*VP', ('*V',), '8##mają'),\n",
+       " ('CP', ('*Comp', 'S'), '7##iż 8##mają 9##cię 10##za 11##nic'),\n",
+       " ('CP',\n",
+       "  ('CP', '*Conj', 'CP'),\n",
+       "  '2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n",
+       " ('CP', ('Punct', '*Comp', 'S'), '2##, 3##iż 4##jesteś 5##nikim'),\n",
+       " ('NP', ('*N',), '11##nic'),\n",
+       " ('NP', ('*N',), '5##nikim'),\n",
+       " ('NP', ('*N',), '9##cię'),\n",
+       " ('NP',\n",
+       "  ('*NP', 'CP'),\n",
+       "  '1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n",
+       " ('PrepNP', ('*Prep', 'NP'), '10##za 11##nic'),\n",
+       " ('Punct', ('12##!',), '12##!'),\n",
+       " ('Punct', ('2##,',), '2##,'),\n",
+       " ('ROOT',\n",
+       "  ('*PrepNP', 'Punct'),\n",
+       "  '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic 12##!'),\n",
+       " ('S', ('*VP', 'NP'), '4##jesteś 5##nikim'),\n",
+       " ('S', ('*VP', 'NP', 'PrepNP'), '8##mają 9##cię 10##za 11##nic')}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "!!!!!!!!!!!!!!! *PrepNP 0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{('*Comp', ('3##iż',), '3##iż'),\n",
+       " ('*Comp', ('7##iż',), '7##iż'),\n",
+       " ('*Conj', ('6##,',), '6##,'),\n",
+       " ('*N', ('1##tym',), '1##tym'),\n",
+       " ('*N', ('11##nic',), '11##nic'),\n",
+       " ('*N', ('5##nikim',), '5##nikim'),\n",
+       " ('*N', ('9##cię',), '9##cię'),\n",
+       " ('*NP', ('*N',), '1##tym'),\n",
+       " ('*Prep', ('0##O',), '0##O'),\n",
+       " ('*Prep', ('10##za',), '10##za'),\n",
+       " ('*PrepNP',\n",
+       "  ('*Prep', 'NP'),\n",
+       "  '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n",
+       " ('*PrepNP',\n",
+       "  ('*PrepNP',),\n",
+       "  '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n",
+       " ('*V', ('4##jesteś',), '4##jesteś'),\n",
+       " ('*V', ('8##mają',), '8##mają'),\n",
+       " ('*VP', ('*V',), '4##jesteś'),\n",
+       " ('*VP', ('*V',), '8##mają'),\n",
+       " ('CP', ('*Comp', 'S'), '7##iż 8##mają 9##cię 10##za 11##nic'),\n",
+       " ('CP',\n",
+       "  ('CP', '*Conj', 'CP'),\n",
+       "  '2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n",
+       " ('CP', ('Punct', '*Comp', 'S'), '2##, 3##iż 4##jesteś 5##nikim'),\n",
+       " ('NP', ('*N',), '11##nic'),\n",
+       " ('NP', ('*N',), '5##nikim'),\n",
+       " ('NP', ('*N',), '9##cię'),\n",
+       " ('NP',\n",
+       "  ('*NP', 'CP'),\n",
+       "  '1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic'),\n",
+       " ('PrepNP', ('*Prep', 'NP'), '10##za 11##nic'),\n",
+       " ('Punct', ('12##!',), '12##!'),\n",
+       " ('Punct', ('2##,',), '2##,'),\n",
+       " ('ROOT',\n",
+       "  ('*PrepNP', 'Punct'),\n",
+       "  '0##O 1##tym 2##, 3##iż 4##jesteś 5##nikim 6##, 7##iż 8##mają 9##cię 10##za 11##nic 12##!'),\n",
+       " ('S', ('*VP', 'NP'), '4##jesteś 5##nikim'),\n",
+       " ('S', ('*VP', 'NP', 'PrepNP'), '8##mają 9##cię 10##za 11##nic')}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "!!!!!!!!!!!!!!! *NP 0##Cztery 1##małe 2##groszki 3##w 4##strąku 5##w 6##tunelu 7##miłości\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{('*Adj', ('1##małe',), '1##małe'),\n",
+       " ('*N', ('2##groszki',), '2##groszki'),\n",
+       " ('*N', ('4##strąku',), '4##strąku'),\n",
+       " ('*N', ('6##tunelu',), '6##tunelu'),\n",
+       " ('*N', ('7##miłości',), '7##miłości'),\n",
+       " ('*NP', ('*N',), '2##groszki'),\n",
+       " ('*NP', ('*N',), '6##tunelu'),\n",
+       " ('*NP',\n",
+       "  ('*NP',),\n",
+       "  '0##Cztery 1##małe 2##groszki 3##w 4##strąku 5##w 6##tunelu 7##miłości'),\n",
+       " ('*NP',\n",
+       "  ('*NumP', 'NP'),\n",
+       "  '0##Cztery 1##małe 2##groszki 3##w 4##strąku 5##w 6##tunelu 7##miłości'),\n",
+       " ('*Num', ('0##Cztery',), '0##Cztery'),\n",
+       " ('*NumP', ('*Num',), '0##Cztery'),\n",
+       " ('*Prep', ('3##w',), '3##w'),\n",
+       " ('*Prep', ('5##w',), '5##w'),\n",
+       " ('AdjP', ('*Adj',), '1##małe'),\n",
+       " ('NP', ('*N',), '4##strąku'),\n",
+       " ('NP', ('*N',), '7##miłości'),\n",
+       " ('NP', ('*NP', 'NP'), '6##tunelu 7##miłości'),\n",
+       " ('NP',\n",
+       "  ('AdjP', '*NP', 'PrepNP', 'PrepNP'),\n",
+       "  '1##małe 2##groszki 3##w 4##strąku 5##w 6##tunelu 7##miłości'),\n",
+       " ('PrepNP', ('*Prep', 'NP'), '3##w 4##strąku'),\n",
+       " ('PrepNP', ('*Prep', 'NP'), '5##w 6##tunelu 7##miłości'),\n",
+       " ('Punct', ('8##.',), '8##.'),\n",
+       " ('ROOT',\n",
+       "  ('*NP', 'Punct'),\n",
+       "  '0##Cztery 1##małe 2##groszki 3##w 4##strąku 5##w 6##tunelu 7##miłości 8##.')}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "!!!!!!!!!!!!!!! *PrepNP 0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{('*Adv', ('3##gdy',), '3##gdy'),\n",
+       " ('*N', ('1##chwili',), '1##chwili'),\n",
+       " ('*N', ('7##Alpy',), '7##Alpy'),\n",
+       " ('*N', ('8##słonie',), '8##słonie'),\n",
+       " ('*N', ('9##Hannibala',), '9##Hannibala'),\n",
+       " ('*NP', ('*N',), '1##chwili'),\n",
+       " ('*NP', ('*N',), '8##słonie'),\n",
+       " ('*Prep', ('0##W',), '0##W'),\n",
+       " ('*Prep', ('6##przez',), '6##przez'),\n",
+       " ('*PrepNP',\n",
+       "  ('*Prep', 'NP'),\n",
+       "  '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n",
+       " ('*PrepNP',\n",
+       "  ('*PrepNP',),\n",
+       "  '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n",
+       " ('*S',\n",
+       "  ('AdvP', '*VP', 'PrepNP', 'NP'),\n",
+       "  '3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n",
+       " ('*V', ('4##przeprowadzał', '5##em'), '4##przeprowadzał 5##em'),\n",
+       " ('*VP', ('*V',), '4##przeprowadzał 5##em'),\n",
+       " ('AdvP', ('*Adv',), '3##gdy'),\n",
+       " ('CP',\n",
+       "  ('Punct', '*S'),\n",
+       "  '2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n",
+       " ('NP', ('*N',), '7##Alpy'),\n",
+       " ('NP', ('*N',), '9##Hannibala'),\n",
+       " ('NP',\n",
+       "  ('*NP', 'CP'),\n",
+       "  '1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n",
+       " ('NP', ('*NP', 'NP'), '8##słonie 9##Hannibala'),\n",
+       " ('PrepNP', ('*Prep', 'NP'), '6##przez 7##Alpy'),\n",
+       " ('Punct', ('10##.',), '10##.'),\n",
+       " ('Punct', ('2##,',), '2##,'),\n",
+       " ('ROOT',\n",
+       "  ('*PrepNP', 'Punct'),\n",
+       "  '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala 10##.')}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "!!!!!!!!!!!!!!! *PrepNP 0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{('*Adv', ('3##gdy',), '3##gdy'),\n",
+       " ('*N', ('1##chwili',), '1##chwili'),\n",
+       " ('*N', ('7##Alpy',), '7##Alpy'),\n",
+       " ('*N', ('8##słonie',), '8##słonie'),\n",
+       " ('*N', ('9##Hannibala',), '9##Hannibala'),\n",
+       " ('*NP', ('*N',), '1##chwili'),\n",
+       " ('*NP', ('*N',), '8##słonie'),\n",
+       " ('*Prep', ('0##W',), '0##W'),\n",
+       " ('*Prep', ('6##przez',), '6##przez'),\n",
+       " ('*PrepNP',\n",
+       "  ('*Prep', 'NP'),\n",
+       "  '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n",
+       " ('*PrepNP',\n",
+       "  ('*PrepNP',),\n",
+       "  '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n",
+       " ('*S',\n",
+       "  ('AdvP', '*VP', 'PrepNP', 'NP'),\n",
+       "  '3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n",
+       " ('*V', ('4##przeprowadzał', '5##em'), '4##przeprowadzał 5##em'),\n",
+       " ('*VP', ('*V',), '4##przeprowadzał 5##em'),\n",
+       " ('AdvP', ('*Adv',), '3##gdy'),\n",
+       " ('CP',\n",
+       "  ('Punct', '*S'),\n",
+       "  '2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n",
+       " ('NP', ('*N',), '7##Alpy'),\n",
+       " ('NP', ('*N',), '9##Hannibala'),\n",
+       " ('NP',\n",
+       "  ('*NP', 'CP'),\n",
+       "  '1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala'),\n",
+       " ('NP', ('*NP', 'NP'), '8##słonie 9##Hannibala'),\n",
+       " ('PrepNP', ('*Prep', 'NP'), '6##przez 7##Alpy'),\n",
+       " ('Punct', ('10##.',), '10##.'),\n",
+       " ('Punct', ('2##,',), '2##,'),\n",
+       " ('ROOT',\n",
+       "  ('*PrepNP', 'Punct'),\n",
+       "  '0##W 1##chwili 2##, 3##gdy 4##przeprowadzał 5##em 6##przez 7##Alpy 8##słonie 9##Hannibala 10##.')}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "!!!!!!!!!!!!!!! *PrepNP 1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{('*Adj', ('2##roczną',), '2##roczną'),\n",
+       " ('*Adj', ('7##czternasty',), '7##czternasty'),\n",
+       " ('*N', ('3##misję',), '3##misję'),\n",
+       " ('*N', ('5##Tytana',), '5##Tytana'),\n",
+       " ('*N', ('8##księżyc',), '8##księżyc'),\n",
+       " ('*N', ('9##Saturna',), '9##Saturna'),\n",
+       " ('*NP', ('*N',), '3##misję'),\n",
+       " ('*NP', ('*N',), '5##Tytana'),\n",
+       " ('*NP', ('*N',), '8##księżyc'),\n",
+       " ('*Prep', ('1##na',), '1##na'),\n",
+       " ('*Prep', ('4##na',), '4##na'),\n",
+       " ('*PrepNP',\n",
+       "  ('*Prep', 'NP'),\n",
+       "  '1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('*PrepNP',\n",
+       "  ('*PrepNP',),\n",
+       "  '1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('AdjP', ('*Adj',), '2##roczną'),\n",
+       " ('AdjP', ('*Adj',), '7##czternasty'),\n",
+       " ('NP', ('*N',), '9##Saturna'),\n",
+       " ('NP', ('*NP', 'NP'), '5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('NP',\n",
+       "  ('AdjP', '*NP', 'PrepNP'),\n",
+       "  '2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('NP',\n",
+       "  ('Punct', 'AdjP', '*NP', 'NP'),\n",
+       "  '6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('PrepNP',\n",
+       "  ('*Prep', 'NP'),\n",
+       "  '4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('Punct', ('0##-',), '0##-'),\n",
+       " ('Punct', ('10##.',), '10##.'),\n",
+       " ('Punct', ('6##,',), '6##,'),\n",
+       " ('ROOT',\n",
+       "  ('Punct', '*PrepNP', 'Punct'),\n",
+       "  '0##- 1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna 10##.')}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "!!!!!!!!!!!!!!! *PrepNP 1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{('*Adj', ('2##roczną',), '2##roczną'),\n",
+       " ('*Adj', ('7##czternasty',), '7##czternasty'),\n",
+       " ('*N', ('3##misję',), '3##misję'),\n",
+       " ('*N', ('5##Tytana',), '5##Tytana'),\n",
+       " ('*N', ('8##księżyc',), '8##księżyc'),\n",
+       " ('*N', ('9##Saturna',), '9##Saturna'),\n",
+       " ('*NP', ('*N',), '3##misję'),\n",
+       " ('*NP', ('*N',), '5##Tytana'),\n",
+       " ('*NP', ('*N',), '8##księżyc'),\n",
+       " ('*Prep', ('1##na',), '1##na'),\n",
+       " ('*Prep', ('4##na',), '4##na'),\n",
+       " ('*PrepNP',\n",
+       "  ('*Prep', 'NP'),\n",
+       "  '1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('*PrepNP',\n",
+       "  ('*PrepNP',),\n",
+       "  '1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('AdjP', ('*Adj',), '2##roczną'),\n",
+       " ('AdjP', ('*Adj',), '7##czternasty'),\n",
+       " ('NP', ('*N',), '9##Saturna'),\n",
+       " ('NP', ('*NP', 'NP'), '5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('NP',\n",
+       "  ('AdjP', '*NP', 'PrepNP'),\n",
+       "  '2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('NP',\n",
+       "  ('Punct', 'AdjP', '*NP', 'NP'),\n",
+       "  '6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('PrepNP',\n",
+       "  ('*Prep', 'NP'),\n",
+       "  '4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna'),\n",
+       " ('Punct', ('0##-',), '0##-'),\n",
+       " ('Punct', ('10##.',), '10##.'),\n",
+       " ('Punct', ('6##,',), '6##,'),\n",
+       " ('ROOT',\n",
+       "  ('Punct', '*PrepNP', 'Punct'),\n",
+       "  '0##- 1##na 2##roczną 3##misję 4##na 5##Tytana 6##, 7##czternasty 8##księżyc 9##Saturna 10##.')}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "evaluation_val, errors_val = eval_trees(val_trees, val_pred_trees)\n",
+    "evaluation_test, errors_test = eval_trees(test_trees, test_pred_trees)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 56,
+   "id": "65af3522",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "DEV:\n",
+      "precision:    0.974400637684714\n",
+      "recall:       0.9742960930674555\n",
+      "f1:           0.9743483625717548\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Column-wise totals of the per-item count triples (named tp, fp, fn below).\n",
+    "tp, fp, fn = (sum(counts) for counts in zip(*evaluation_val))\n",
+    "# Corpus-level precision, recall and F1 computed from the summed counts.\n",
+    "p = tp / (tp + fp)\n",
+    "r = tp / (tp + fn)\n",
+    "f1 = 2 * tp / (2 * tp + fp + fn)\n",
+    "print('DEV:')\n",
+    "print('precision:   ', p)\n",
+    "print('recall:      ', r)\n",
+    "print('f1:          ', f1)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 57,
+   "id": "8e0f3f93",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "TEST:\n",
+      "precision:    0.9774147274466051\n",
+      "recall:       0.9775082092645137\n",
+      "f1:           0.9774614661204711\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Column-wise totals of the per-item count triples (named tp, fp, fn below).\n",
+    "tp, fp, fn = (sum(counts) for counts in zip(*evaluation_test))\n",
+    "# Corpus-level precision, recall and F1 computed from the summed counts.\n",
+    "p = tp / (tp + fp)\n",
+    "r = tp / (tp + fn)\n",
+    "f1 = 2 * tp / (2 * tp + fp + fn)\n",
+    "print('TEST:')\n",
+    "print('precision:   ', p)\n",
+    "print('recall:      ', r)\n",
+    "print('f1:          ', f1)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "302b2333",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "torch_benepar",
+   "language": "python",
+   "name": "torch_benepar"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.6"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git b/COMBO/DataPreparation.ipynb a/COMBO/DataPreparation.ipynb
new file mode 100644
index 0000000..fde3938
--- /dev/null
+++ a/COMBO/DataPreparation.ipynb
@@ -0,0 +1,213 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 46,
+   "id": "5cd26f6f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "\n",
+    "from datasets import load_dataset\n",
+    "\n",
+    "from IPython.display import display"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 47,
+   "id": "fecef4af",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Found cached dataset pdb_c_beta (/home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1)\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "1c89c7103bba4347a3fa7d23cac42cfe",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  0%|          | 0/3 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "pdbc_dataset = load_dataset('../pdb_c_beta')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 48,
+   "id": "23da801f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# NOTE(review): the directory name is spelled 'connlu' (not 'conllu'); kept unchanged\n",
+    "# because the recorded outputs of this notebook reference paths under it.\n",
+    "CONLLU_DIR = 'connlu'\n",
+    "# Start from an empty output directory; -f / -p keep a first run (no directory yet) quiet.\n",
+    "! rm -rf {CONLLU_DIR}\n",
+    "! mkdir -p {CONLLU_DIR}"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 50,
+   "id": "91fb3bf3",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sys\n",
+    "sys.path.append('../')\n",
+    "from neural_parser.hybrid_tree_utils import tree_from_dataset_instance"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 60,
+   "id": "c105feff",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "train\n",
+      "    connlu/pdbc-train.conllu\n",
+      "        17659\n",
+      "    connlu/pdbc-cont-train.conllu\n",
+      "        15903\n",
+      "validation\n",
+      "    connlu/pdbc-validation.conllu\n",
+      "        2211\n",
+      "    connlu/pdbc-cont-validation.conllu\n",
+      "        1980\n",
+      "test\n",
+      "    connlu/pdbc-test.conllu\n",
+      "        2205\n",
+      "    connlu/pdbc-cont-test.conllu\n",
+      "        1990\n"
+     ]
+    }
+   ],
+   "source": [
+    "features = pdbc_dataset['train'].features\n",
+    "# Label feature used to turn integer deprel ids into their string names.\n",
+    "deprel_labels = features['deprels'].feature\n",
+    "\n",
+    "# For every split, write two CoNLL-U files: one with all sentences and one with\n",
+    "# only the sentences whose tree (per tree_from_dataset_instance) is continuous.\n",
+    "# Only the ID, FORM, LEMMA, HEAD, DEPREL and DEPS columns are filled; the rest are '_'.\n",
+    "for part, dataset in pdbc_dataset.items():\n",
+    "    print(part)\n",
+    "    s_cont, s_all = [], []\n",
+    "    for sentence in dataset:\n",
+    "        tokens = sentence['tokens']\n",
+    "        lemmas = sentence['lemmas']\n",
+    "        # Shift heads by one to match the 1-based token ids; a missing head (None) becomes 0.\n",
+    "        heads = [h + 1 if h is not None else 0 for h in sentence['heads']]\n",
+    "        deprels = [deprel_labels.int2str(d) for d in sentence['deprels']]\n",
+    "        deprels = ['root' if deprel == 'ROOT' else deprel for deprel in deprels]\n",
+    "        rows = [f'# text = {\" \".join(tokens)}'] + [\n",
+    "            f'{i + 1}\\t{t}\\t{l}\\t_\\t_\\t_\\t{h}\\t{d}\\t{h}:{d}\\t_'\n",
+    "            for i, (t, l, h, d) in enumerate(zip(tokens, lemmas, heads, deprels))\n",
+    "        ]\n",
+    "        s_all.append(rows)\n",
+    "        if tree_from_dataset_instance(sentence, features).is_continuous():\n",
+    "            s_cont.append(rows)\n",
+    "    f_all = os.path.join(CONLLU_DIR, f'pdbc-{part}.conllu')\n",
+    "    f_cont = os.path.join(CONLLU_DIR, f'pdbc-cont-{part}.conllu')\n",
+    "    for path, sentences in ((f_all, s_all), (f_cont, s_cont)):\n",
+    "        # Explicit UTF-8: the tokens contain non-ASCII (Polish) characters and the\n",
+    "        # platform default encoding is not guaranteed to handle them.\n",
+    "        with open(path, 'w', encoding='utf-8') as f:\n",
+    "            print('   ', path)\n",
+    "            print('       ', len(sentences))\n",
+    "            # Sentences are separated by a blank line.\n",
+    "            for rows in sentences:\n",
+    "                print('\\n'.join(rows), end='\\n\\n', file=f)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 61,
+   "id": "c849233c",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "   32509   319813  1398303 connlu/pdbc-cont-test.conllu\n",
+      "   32509   319813  1198902 connlu/pdbc-cont-test-pred.conllu\n",
+      "  271337  2682725 11781617 connlu/pdbc-cont-train.conllu\n",
+      "   33491   330792  1452373 connlu/pdbc-cont-validation.conllu\n",
+      "   33491   330792  1244192 connlu/pdbc-cont-validation-pred.conllu\n",
+      "   37754   373431  1639937 connlu/pdbc-test.conllu\n",
+      "   37754   373431  1406776 connlu/pdbc-test-pred.conllu\n",
+      "  315364  3133712 13808053 connlu/pdbc-train.conllu\n",
+      "   38987   386865  1704685 connlu/pdbc-validation.conllu\n",
+      "   38987   386865  1461922 connlu/pdbc-validation-pred.conllu\n",
+      "  872183  8638239 37096760 total\n"
+     ]
+    }
+   ],
+   "source": [
+    "! wc {CONLLU_DIR}/*.conllu"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 62,
+   "id": "6b571716",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "# text = Skośnooka dziewczynka trzyma w rękach drewniane pałeczki , a przed nią znajdują się naczynia kuchenne .\r\n",
+      "1\tSkośnooka\tskośnooki\t_\t_\t_\t2\tadjunct\t2:adjunct\t_\r\n",
+      "2\tdziewczynka\tdziewczynka\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n",
+      "3\ttrzyma\ttrzymać\t_\t_\t_\t9\tconjunct\t9:conjunct\t_\r\n",
+      "4\tw\tw\t_\t_\t_\t3\tadjunct_locat\t3:adjunct_locat\t_\r\n",
+      "5\trękach\tręka\t_\t_\t_\t4\tcomp\t4:comp\t_\r\n",
+      "6\tdrewniane\tdrewniany\t_\t_\t_\t7\tadjunct\t7:adjunct\t_\r\n",
+      "7\tpałeczki\tpałeczka\t_\t_\t_\t3\tobj\t3:obj\t_\r\n",
+      "8\t,\t,\t_\t_\t_\t9\tpunct\t9:punct\t_\r\n",
+      "9\ta\ta\t_\t_\t_\t0\troot\t0:root\t_\r\n"
+     ]
+    }
+   ],
+   "source": [
+    "! head {CONLLU_DIR}/pdbc-train.conllu"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "TF_zajecia",
+   "language": "python",
+   "name": "tf_zajecia"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.6"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git b/COMBO/ParseValAndTrain.ipynb a/COMBO/ParseValAndTrain.ipynb
new file mode 100644
index 0000000..a8e8ad0
--- /dev/null
+++ a/COMBO/ParseValAndTrain.ipynb
@@ -0,0 +1,1213 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "aabfb24b",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "COMBO = '/home/kkrasnowska/anaconda3/envs/combo_p39/bin/combo'"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "787fff78",
+   "metadata": {},
+   "source": [
+    "Main model"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "1d9daaa9",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I0407 10:49:31.448594 140072765682752 archival.py:184] loading archive file model-pdbc/model.tar.gz\n",
+      "I0407 10:49:31.449148 140072765682752 archival.py:263] extracting archive file model-pdbc/model.tar.gz to temp dir /tmp/tmp_htckuhc\n",
+      "I0407 10:49:48.075045 140072765682752 params.py:248] dataset_reader.type = conllu\n",
+      "I0407 10:49:48.075561 140072765682752 params.py:248] dataset_reader.lazy = False\n",
+      "I0407 10:49:48.075693 140072765682752 params.py:248] dataset_reader.cache_directory = None\n",
+      "I0407 10:49:48.075764 140072765682752 params.py:248] dataset_reader.max_instances = None\n",
+      "I0407 10:49:48.075832 140072765682752 params.py:248] dataset_reader.manual_distributed_sharding = False\n",
+      "I0407 10:49:48.075901 140072765682752 params.py:248] dataset_reader.manual_multi_process_sharding = False\n",
+      "I0407 10:49:48.076193 140072765682752 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n",
+      "I0407 10:49:48.076388 140072765682752 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n",
+      "I0407 10:49:48.076621 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:49:48.076697 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:49:48.076790 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:49:48.076939 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:49:48.077063 140072765682752 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n",
+      "I0407 10:49:48.077118 140072765682752 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n",
+      "I0407 10:49:48.077185 140072765682752 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n",
+      "I0407 10:49:48.077238 140072765682752 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:49:48.077383 140072765682752 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n",
+      "I0407 10:49:48.077555 140072765682752 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n",
+      "I0407 10:49:48.077628 140072765682752 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n",
+      "I0407 10:49:48.077702 140072765682752 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n",
+      "I0407 10:49:48.077838 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n",
+      "I0407 10:49:48.078031 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n",
+      "I0407 10:49:48.078231 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:49:48.078300 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:49:48.078378 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:49:48.078666 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:49:48.078786 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n",
+      "I0407 10:49:48.078862 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n",
+      "I0407 10:49:48.078916 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n",
+      "I0407 10:49:48.078969 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n",
+      "I0407 10:49:48.079103 140072765682752 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n",
+      "I0407 10:49:48.079328 140072765682752 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n",
+      "I0407 10:49:48.079406 140072765682752 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:49:48.079461 140072765682752 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n",
+      "I0407 10:49:48.079525 140072765682752 params.py:248] dataset_reader.token_indexers.token.max_length = None\n",
+      "I0407 10:49:48.079628 140072765682752 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:49:51.185825 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n",
+      "I0407 10:49:51.186234 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n",
+      "I0407 10:49:51.186336 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n",
+      "I0407 10:49:51.186398 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n",
+      "I0407 10:49:51.186465 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n",
+      "I0407 10:49:51.186517 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n",
+      "I0407 10:49:51.186579 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:49:51.186631 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n",
+      "I0407 10:49:51.186791 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n",
+      "I0407 10:49:51.186975 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n",
+      "I0407 10:49:51.187041 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n",
+      "I0407 10:49:51.187107 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n",
+      "I0407 10:49:51.187170 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n",
+      "I0407 10:49:51.187220 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n",
+      "I0407 10:49:51.187275 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:49:51.187334 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n",
+      "I0407 10:49:51.187556 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n",
+      "I0407 10:49:51.187731 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n",
+      "I0407 10:49:51.187935 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:49:51.187995 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:49:51.188073 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:49:51.188217 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:49:51.188334 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n",
+      "I0407 10:49:51.188398 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n",
+      "I0407 10:49:51.188460 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n",
+      "I0407 10:49:51.188522 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:49:51.188614 140072765682752 params.py:248] dataset_reader.features = ['token', 'char']\n",
+      "I0407 10:49:51.188712 140072765682752 params.py:248] dataset_reader.targets = ['head', 'deprel']\n",
+      "I0407 10:49:51.188802 140072765682752 params.py:248] dataset_reader.use_sem = False\n",
+      "I0407 10:49:51.188952 140072765682752 params.py:248] dataset_reader.type = conllu\n",
+      "I0407 10:49:51.189191 140072765682752 params.py:248] dataset_reader.lazy = False\n",
+      "I0407 10:49:51.189266 140072765682752 params.py:248] dataset_reader.cache_directory = None\n",
+      "I0407 10:49:51.189324 140072765682752 params.py:248] dataset_reader.max_instances = None\n",
+      "I0407 10:49:51.189382 140072765682752 params.py:248] dataset_reader.manual_distributed_sharding = False\n",
+      "I0407 10:49:51.189436 140072765682752 params.py:248] dataset_reader.manual_multi_process_sharding = False\n",
+      "I0407 10:49:51.189675 140072765682752 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n",
+      "I0407 10:49:51.189843 140072765682752 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n",
+      "I0407 10:49:51.190060 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:49:51.190128 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:49:51.190197 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:49:51.190324 140072765682752 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:49:51.190443 140072765682752 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n",
+      "I0407 10:49:51.190508 140072765682752 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n",
+      "I0407 10:49:51.190564 140072765682752 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n",
+      "I0407 10:49:51.190627 140072765682752 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:49:51.190772 140072765682752 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n",
+      "I0407 10:49:51.190932 140072765682752 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n",
+      "I0407 10:49:51.191003 140072765682752 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n",
+      "I0407 10:49:51.191065 140072765682752 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n",
+      "I0407 10:49:51.191206 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n",
+      "I0407 10:49:51.191369 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n",
+      "I0407 10:49:51.191561 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:49:51.191629 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:49:51.191706 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:49:51.191827 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:49:51.191938 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n",
+      "I0407 10:49:51.191999 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n",
+      "I0407 10:49:51.192067 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n",
+      "I0407 10:49:51.192142 140072765682752 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n",
+      "I0407 10:49:51.192281 140072765682752 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n",
+      "I0407 10:49:51.192501 140072765682752 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n",
+      "I0407 10:49:51.192575 140072765682752 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:49:51.192638 140072765682752 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n",
+      "I0407 10:49:51.192698 140072765682752 params.py:248] dataset_reader.token_indexers.token.max_length = None\n",
+      "I0407 10:49:51.192795 140072765682752 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:49:51.194080 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I0407 10:49:51.194318 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n",
+      "I0407 10:49:51.194404 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n",
+      "I0407 10:49:51.194471 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n",
+      "I0407 10:49:51.194532 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n",
+      "I0407 10:49:51.194586 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n",
+      "I0407 10:49:51.194648 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:49:51.194708 140072765682752 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n",
+      "I0407 10:49:51.194854 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n",
+      "I0407 10:49:51.195033 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n",
+      "I0407 10:49:51.195105 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n",
+      "I0407 10:49:51.195167 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n",
+      "I0407 10:49:51.195222 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n",
+      "I0407 10:49:51.195280 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n",
+      "I0407 10:49:51.195338 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:49:51.195398 140072765682752 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n",
+      "I0407 10:49:51.195601 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n",
+      "I0407 10:49:51.195774 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n",
+      "I0407 10:49:51.195971 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:49:51.196039 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:49:51.196113 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:49:51.196244 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:49:51.196364 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n",
+      "I0407 10:49:51.196430 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n",
+      "I0407 10:49:51.196492 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n",
+      "I0407 10:49:51.196552 140072765682752 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:49:51.196640 140072765682752 params.py:248] dataset_reader.features = ['token', 'char']\n",
+      "I0407 10:49:51.196732 140072765682752 params.py:248] dataset_reader.targets = ['head', 'deprel']\n",
+      "I0407 10:49:51.196815 140072765682752 params.py:248] dataset_reader.use_sem = False\n",
+      "I0407 10:49:51.197346 140072765682752 params.py:248] vocabulary.type = from_instances_extended\n",
+      "I0407 10:49:51.197421 140072765682752 vocabulary.py:323] Loading token dictionary from /tmp/tmp_htckuhc/vocabulary.\n",
+      "I0407 10:49:51.197736 140072765682752 filelock.py:254] Lock 140069359832176 acquired on /tmp/tmp_htckuhc/vocabulary/.lock\n",
+      "I0407 10:49:51.198361 140072765682752 filelock.py:317] Lock 140069359832176 released on /tmp/tmp_htckuhc/vocabulary/.lock\n",
+      "I0407 10:49:51.198865 140072765682752 params.py:248] model.type = semantic_multitask\n",
+      "I0407 10:49:51.199399 140072765682752 params.py:248] model.text_field_embedder.type = basic\n",
+      "I0407 10:49:51.199762 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n",
+      "I0407 10:49:51.199955 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.embedding_dim = 64\n",
+      "I0407 10:49:51.200206 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n",
+      "I0407 10:49:51.200286 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n",
+      "I0407 10:49:51.200380 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n",
+      "I0407 10:49:51.200467 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n",
+      "I0407 10:49:51.200556 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n",
+      "I0407 10:49:51.200649 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n",
+      "I0407 10:49:51.200745 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n",
+      "I0407 10:49:51.200886 140072765682752 params.py:248] type = relu\n",
+      "I0407 10:49:51.201073 140072765682752 params.py:248] type = relu\n",
+      "I0407 10:49:51.201222 140072765682752 params.py:248] type = linear\n",
+      "I0407 10:49:51.208180 140072765682752 params.py:248] model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n",
+      "I0407 10:49:51.208718 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n",
+      "I0407 10:49:51.208946 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:49:51.209028 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.projection_dim = 100\n",
+      "I0407 10:49:51.209110 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f646dd85280>\n",
+      "I0407 10:49:51.209182 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n",
+      "I0407 10:49:51.209239 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.freeze_transformer = True\n",
+      "I0407 10:49:51.209295 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.last_layer_only = True\n",
+      "I0407 10:49:51.209401 140072765682752 params.py:384] model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:49:51.209471 140072765682752 params.py:248] model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n",
+      "I0407 10:49:58.747374 140072765682752 params.py:248] model.seq_encoder.type = combo_encoder\n",
+      "I0407 10:49:58.747746 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.input_size = 164\n",
+      "I0407 10:49:58.747819 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.hidden_size = 512\n",
+      "I0407 10:49:58.747869 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.num_layers = 2\n",
+      "I0407 10:49:58.747919 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n",
+      "I0407 10:49:58.747966 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n",
+      "I0407 10:49:58.748013 140072765682752 params.py:248] model.seq_encoder.stacked_bilstm.use_highway = False\n",
+      "I0407 10:49:59.084017 140072765682752 params.py:248] model.seq_encoder.layer_dropout_probability = 0.33\n",
+      "I0407 10:49:59.084280 140072765682752 params.py:248] model.use_sample_weight = True\n",
+      "I0407 10:49:59.084377 140072765682752 params.py:248] model.lemmatizer = None\n",
+      "I0407 10:49:59.084436 140072765682752 params.py:248] model.upos_tagger = None\n",
+      "I0407 10:49:59.084487 140072765682752 params.py:248] model.xpos_tagger = None\n",
+      "I0407 10:49:59.084537 140072765682752 params.py:248] model.semantic_relation = None\n",
+      "I0407 10:49:59.084585 140072765682752 params.py:248] model.morphological_feat = None\n",
+      "I0407 10:49:59.084832 140072765682752 params.py:248] model.dependency_relation.type = combo_dependency_parsing_from_vocab\n",
+      "I0407 10:49:59.085025 140072765682752 params.py:248] model.dependency_relation.vocab_namespace = deprel_labels\n",
+      "I0407 10:49:59.085301 140072765682752 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n",
+      "I0407 10:49:59.085365 140072765682752 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n",
+      "I0407 10:49:59.085421 140072765682752 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n",
+      "I0407 10:49:59.085520 140072765682752 params.py:248] type = tanh\n",
+      "I0407 10:49:59.085608 140072765682752 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n",
+      "I0407 10:49:59.089095 140072765682752 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n",
+      "I0407 10:49:59.089183 140072765682752 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n",
+      "I0407 10:49:59.089244 140072765682752 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n",
+      "I0407 10:49:59.089346 140072765682752 params.py:248] type = tanh\n",
+      "I0407 10:49:59.089423 140072765682752 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n",
+      "I0407 10:49:59.092701 140072765682752 params.py:248] model.dependency_relation.head_predictor.cycle_loss_n = 0\n",
+      "I0407 10:49:59.092917 140072765682752 params.py:248] model.dependency_relation.head_projection_layer.in_features = 1024\n",
+      "I0407 10:49:59.092972 140072765682752 params.py:248] model.dependency_relation.head_projection_layer.out_features = 128\n",
+      "I0407 10:49:59.093022 140072765682752 params.py:248] model.dependency_relation.head_projection_layer.activation = tanh\n",
+      "I0407 10:49:59.093108 140072765682752 params.py:248] type = tanh\n",
+      "I0407 10:49:59.093183 140072765682752 params.py:248] model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n",
+      "I0407 10:49:59.094336 140072765682752 params.py:248] model.dependency_relation.dependency_projection_layer.in_features = 1024\n",
+      "I0407 10:49:59.094411 140072765682752 params.py:248] model.dependency_relation.dependency_projection_layer.out_features = 128\n",
+      "I0407 10:49:59.094463 140072765682752 params.py:248] model.dependency_relation.dependency_projection_layer.activation = tanh\n",
+      "I0407 10:49:59.094551 140072765682752 params.py:248] type = tanh\n",
+      "I0407 10:49:59.094618 140072765682752 params.py:248] model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n",
+      "I0407 10:49:59.095806 140072765682752 params.py:248] model.enhanced_dependency_relation = None\n",
+      "I0407 10:49:59.096206 140072765682752 params.py:248] model.regularizer.regexes.0.1.type = l2\n",
+      "I0407 10:49:59.096345 140072765682752 params.py:248] model.regularizer.regexes.0.1.alpha = 1e-06\n",
+      "I0407 10:49:59.096471 140072765682752 params.py:248] model.regularizer.regexes.1.1.type = l2\n",
+      "I0407 10:49:59.096584 140072765682752 params.py:248] model.regularizer.regexes.1.1.alpha = 1e-06\n",
+      "I0407 10:49:59.096696 140072765682752 params.py:248] model.regularizer.regexes.2.1.type = l2\n",
+      "I0407 10:49:59.096809 140072765682752 params.py:248] model.regularizer.regexes.2.1.alpha = 1e-06\n",
+      "I0407 10:49:59.096917 140072765682752 params.py:248] model.regularizer.regexes.3.1.type = l2\n",
+      "I0407 10:49:59.097025 140072765682752 params.py:248] model.regularizer.regexes.3.1.alpha = 1e-05\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I0407 10:50:01.854557 140072765682752 archival.py:211] removing temporary unarchived model dir at /tmp/tmp_htckuhc\n",
+      "reading instances: 2211it [01:52, 19.69it/s]\n"
+     ]
+    }
+   ],
+   "source": [
+    "! {COMBO} --mode predict \\\n",
+    "    --cuda_device 0 \\\n",
+    "    --model_path model-pdbc/model.tar.gz \\\n",
+    "    --input_file connlu/pdbc-validation.conllu \\\n",
+    "    --output_file connlu/pdbc-validation-pred.conllu"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "11f1b7b1",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "# text = Dwie dziewczynki opierają się o dach kapliczki , chłopiec wspina się na niego , a trzecia dziewczynka stoi obok .\r\n",
+      "1\tDwie\tdwa\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n",
+      "2\tdziewczynki\tdziewczynka\t_\t_\t_\t1\tcomp\t1:comp\t_\r\n",
+      "3\topierają\topierać\t_\t_\t_\t15\tconjunct\t15:conjunct\t_\r\n",
+      "4\tsię\tsię\t_\t_\t_\t3\trefl\t3:refl\t_\r\n",
+      "5\to\to\t_\t_\t_\t3\tcomp\t3:comp\t_\r\n",
+      "6\tdach\tdach\t_\t_\t_\t5\tcomp\t5:comp\t_\r\n",
+      "7\tkapliczki\tkapliczka\t_\t_\t_\t6\tadjunct\t6:adjunct\t_\r\n",
+      "8\t,\t,\t_\t_\t_\t15\tpunct\t15:punct\t_\r\n",
+      "9\tchłopiec\tchłopiec\t_\t_\t_\t10\tsubj\t10:subj\t_\r\n"
+     ]
+    }
+   ],
+   "source": [
+    "! head connlu/pdbc-validation.conllu"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "8fa72124",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "# text = Dwie dziewczynki opierają się o dach kapliczki , chłopiec wspina się na niego , a trzecia dziewczynka stoi obok .\r\n",
+      "1\tDwie\tdwa\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n",
+      "2\tdziewczynki\tdziewczynka\t_\t_\t_\t1\tcomp\t1:comp\t_\r\n",
+      "3\topierają\topierać\t_\t_\t_\t15\tconjunct\t15:conjunct\t_\r\n",
+      "4\tsię\tsię\t_\t_\t_\t3\trefl\t3:refl\t_\r\n",
+      "5\to\to\t_\t_\t_\t3\tcomp\t3:comp\t_\r\n",
+      "6\tdach\tdach\t_\t_\t_\t5\tcomp\t5:comp\t_\r\n",
+      "7\tkapliczki\tkapliczka\t_\t_\t_\t6\tadjunct\t6:adjunct\t_\r\n",
+      "8\t,\t,\t_\t_\t_\t15\tpunct\t15:punct\t_\r\n",
+      "9\tchłopiec\tchłopiec\t_\t_\t_\t10\tsubj\t10:subj\t_\r\n"
+     ]
+    }
+   ],
+   "source": [
+    "! head connlu/pdbc-validation-pred.conllu"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "dde6dd31",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I0407 10:52:00.220404 139754138821696 archival.py:184] loading archive file model-pdbc/model.tar.gz\n",
+      "I0407 10:52:00.221079 139754138821696 archival.py:263] extracting archive file model-pdbc/model.tar.gz to temp dir /tmp/tmp2jhqu3i6\n",
+      "I0407 10:52:16.996590 139754138821696 params.py:248] dataset_reader.type = conllu\n",
+      "I0407 10:52:16.997079 139754138821696 params.py:248] dataset_reader.lazy = False\n",
+      "I0407 10:52:16.997236 139754138821696 params.py:248] dataset_reader.cache_directory = None\n",
+      "I0407 10:52:16.997326 139754138821696 params.py:248] dataset_reader.max_instances = None\n",
+      "I0407 10:52:16.997391 139754138821696 params.py:248] dataset_reader.manual_distributed_sharding = False\n",
+      "I0407 10:52:16.997456 139754138821696 params.py:248] dataset_reader.manual_multi_process_sharding = False\n",
+      "I0407 10:52:16.997756 139754138821696 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n",
+      "I0407 10:52:16.997950 139754138821696 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n",
+      "I0407 10:52:16.998211 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:52:16.998285 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:52:16.998367 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:52:16.998522 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:52:16.998643 139754138821696 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n",
+      "I0407 10:52:16.998707 139754138821696 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n",
+      "I0407 10:52:16.998770 139754138821696 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n",
+      "I0407 10:52:16.998831 139754138821696 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:52:16.998980 139754138821696 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n",
+      "I0407 10:52:16.999143 139754138821696 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n",
+      "I0407 10:52:16.999213 139754138821696 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n",
+      "I0407 10:52:16.999269 139754138821696 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n",
+      "I0407 10:52:16.999412 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n",
+      "I0407 10:52:16.999578 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n",
+      "I0407 10:52:16.999774 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:52:16.999842 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:52:16.999923 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:52:17.000045 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:52:17.000156 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n",
+      "I0407 10:52:17.000220 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n",
+      "I0407 10:52:17.000282 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n",
+      "I0407 10:52:17.000344 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n",
+      "I0407 10:52:17.000521 139754138821696 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n",
+      "I0407 10:52:17.000770 139754138821696 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n",
+      "I0407 10:52:17.000865 139754138821696 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:52:17.000947 139754138821696 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n",
+      "I0407 10:52:17.001028 139754138821696 params.py:248] dataset_reader.token_indexers.token.max_length = None\n",
+      "I0407 10:52:17.001172 139754138821696 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:52:20.459573 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n",
+      "I0407 10:52:20.459947 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n",
+      "I0407 10:52:20.460046 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n",
+      "I0407 10:52:20.460119 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n",
+      "I0407 10:52:20.460172 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n",
+      "I0407 10:52:20.460235 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n",
+      "I0407 10:52:20.460288 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:52:20.460351 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n",
+      "I0407 10:52:20.460508 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n",
+      "I0407 10:52:20.460695 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n",
+      "I0407 10:52:20.460773 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n",
+      "I0407 10:52:20.460840 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n",
+      "I0407 10:52:20.460901 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n",
+      "I0407 10:52:20.460962 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n",
+      "I0407 10:52:20.461021 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:52:20.461083 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n",
+      "I0407 10:52:20.461313 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n",
+      "I0407 10:52:20.461496 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n",
+      "I0407 10:52:20.461706 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:52:20.461774 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:52:20.461853 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:52:20.462028 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:52:20.462157 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n",
+      "I0407 10:52:20.462226 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n",
+      "I0407 10:52:20.462283 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n",
+      "I0407 10:52:20.462336 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:52:20.462417 139754138821696 params.py:248] dataset_reader.features = ['token', 'char']\n",
+      "I0407 10:52:20.462514 139754138821696 params.py:248] dataset_reader.targets = ['head', 'deprel']\n",
+      "I0407 10:52:20.462607 139754138821696 params.py:248] dataset_reader.use_sem = False\n",
+      "I0407 10:52:20.462767 139754138821696 params.py:248] dataset_reader.type = conllu\n",
+      "I0407 10:52:20.463083 139754138821696 params.py:248] dataset_reader.lazy = False\n",
+      "I0407 10:52:20.463172 139754138821696 params.py:248] dataset_reader.cache_directory = None\n",
+      "I0407 10:52:20.463237 139754138821696 params.py:248] dataset_reader.max_instances = None\n",
+      "I0407 10:52:20.463301 139754138821696 params.py:248] dataset_reader.manual_distributed_sharding = False\n",
+      "I0407 10:52:20.463361 139754138821696 params.py:248] dataset_reader.manual_multi_process_sharding = False\n",
+      "I0407 10:52:20.463605 139754138821696 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n",
+      "I0407 10:52:20.463779 139754138821696 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n",
+      "I0407 10:52:20.463980 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:52:20.464051 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:52:20.464129 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:52:20.464254 139754138821696 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:52:20.464366 139754138821696 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n",
+      "I0407 10:52:20.464429 139754138821696 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n",
+      "I0407 10:52:20.464490 139754138821696 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n",
+      "I0407 10:52:20.464552 139754138821696 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:52:20.464691 139754138821696 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n",
+      "I0407 10:52:20.464847 139754138821696 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n",
+      "I0407 10:52:20.464918 139754138821696 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n",
+      "I0407 10:52:20.464980 139754138821696 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n",
+      "I0407 10:52:20.465120 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n",
+      "I0407 10:52:20.465285 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n",
+      "I0407 10:52:20.465479 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:52:20.465544 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:52:20.465618 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:52:20.465741 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:52:20.465851 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n",
+      "I0407 10:52:20.465914 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n",
+      "I0407 10:52:20.466024 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n",
+      "I0407 10:52:20.466112 139754138821696 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n",
+      "I0407 10:52:20.466268 139754138821696 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n",
+      "I0407 10:52:20.466485 139754138821696 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n",
+      "I0407 10:52:20.466559 139754138821696 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:52:20.466621 139754138821696 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n",
+      "I0407 10:52:20.466682 139754138821696 params.py:248] dataset_reader.token_indexers.token.max_length = None\n",
+      "I0407 10:52:20.466777 139754138821696 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:52:20.468071 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n",
+      "I0407 10:52:20.468319 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n",
+      "I0407 10:52:20.468404 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n",
+      "I0407 10:52:20.468464 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n",
+      "I0407 10:52:20.468523 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n",
+      "I0407 10:52:20.468573 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n",
+      "I0407 10:52:20.468636 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:52:20.468697 139754138821696 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n",
+      "I0407 10:52:20.468832 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n",
+      "I0407 10:52:20.469012 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n",
+      "I0407 10:52:20.469086 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n",
+      "I0407 10:52:20.469144 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n",
+      "I0407 10:52:20.469196 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n",
+      "I0407 10:52:20.469256 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n",
+      "I0407 10:52:20.469320 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:52:20.469382 139754138821696 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n",
+      "I0407 10:52:20.469586 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n",
+      "I0407 10:52:20.469758 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n",
+      "I0407 10:52:20.469957 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:52:20.470050 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:52:20.470128 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:52:20.470261 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:52:20.470381 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n",
+      "I0407 10:52:20.470448 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n",
+      "I0407 10:52:20.470509 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n",
+      "I0407 10:52:20.470579 139754138821696 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:52:20.470668 139754138821696 params.py:248] dataset_reader.features = ['token', 'char']\n",
+      "I0407 10:52:20.470764 139754138821696 params.py:248] dataset_reader.targets = ['head', 'deprel']\n",
+      "I0407 10:52:20.470849 139754138821696 params.py:248] dataset_reader.use_sem = False\n",
+      "I0407 10:52:20.471387 139754138821696 params.py:248] vocabulary.type = from_instances_extended\n",
+      "I0407 10:52:20.471461 139754138821696 vocabulary.py:323] Loading token dictionary from /tmp/tmp2jhqu3i6/vocabulary.\n",
+      "I0407 10:52:20.471798 139754138821696 filelock.py:254] Lock 139750732975216 acquired on /tmp/tmp2jhqu3i6/vocabulary/.lock\n",
+      "I0407 10:52:20.472387 139754138821696 filelock.py:317] Lock 139750732975216 released on /tmp/tmp2jhqu3i6/vocabulary/.lock\n",
+      "I0407 10:52:20.472922 139754138821696 params.py:248] model.type = semantic_multitask\n",
+      "I0407 10:52:20.473455 139754138821696 params.py:248] model.text_field_embedder.type = basic\n",
+      "I0407 10:52:20.473808 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n",
+      "I0407 10:52:20.474030 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.embedding_dim = 64\n",
+      "I0407 10:52:20.474286 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n",
+      "I0407 10:52:20.474377 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n",
+      "I0407 10:52:20.474480 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n",
+      "I0407 10:52:20.474578 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n",
+      "I0407 10:52:20.474673 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n",
+      "I0407 10:52:20.474768 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n",
+      "I0407 10:52:20.474864 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n",
+      "I0407 10:52:20.475005 139754138821696 params.py:248] type = relu\n",
+      "I0407 10:52:20.475197 139754138821696 params.py:248] type = relu\n",
+      "I0407 10:52:20.475347 139754138821696 params.py:248] type = linear\n",
+      "I0407 10:52:20.481609 139754138821696 params.py:248] model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n",
+      "I0407 10:52:20.482178 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n",
+      "I0407 10:52:20.482446 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:52:20.482533 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.projection_dim = 100\n",
+      "I0407 10:52:20.482632 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f1a3e346280>\n",
+      "I0407 10:52:20.482703 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n",
+      "I0407 10:52:20.482769 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.freeze_transformer = True\n",
+      "I0407 10:52:20.482831 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.last_layer_only = True\n",
+      "I0407 10:52:20.482933 139754138821696 params.py:384] model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:52:20.483003 139754138821696 params.py:248] model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I0407 10:52:28.699278 139754138821696 params.py:248] model.seq_encoder.type = combo_encoder\n",
+      "I0407 10:52:28.699747 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.input_size = 164\n",
+      "I0407 10:52:28.699841 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.hidden_size = 512\n",
+      "I0407 10:52:28.699910 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.num_layers = 2\n",
+      "I0407 10:52:28.699976 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n",
+      "I0407 10:52:28.700042 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n",
+      "I0407 10:52:28.700106 139754138821696 params.py:248] model.seq_encoder.stacked_bilstm.use_highway = False\n",
+      "I0407 10:52:29.089101 139754138821696 params.py:248] model.seq_encoder.layer_dropout_probability = 0.33\n",
+      "I0407 10:52:29.089426 139754138821696 params.py:248] model.use_sample_weight = True\n",
+      "I0407 10:52:29.089556 139754138821696 params.py:248] model.lemmatizer = None\n",
+      "I0407 10:52:29.089638 139754138821696 params.py:248] model.upos_tagger = None\n",
+      "I0407 10:52:29.089704 139754138821696 params.py:248] model.xpos_tagger = None\n",
+      "I0407 10:52:29.089766 139754138821696 params.py:248] model.semantic_relation = None\n",
+      "I0407 10:52:29.089827 139754138821696 params.py:248] model.morphological_feat = None\n",
+      "I0407 10:52:29.090160 139754138821696 params.py:248] model.dependency_relation.type = combo_dependency_parsing_from_vocab\n",
+      "I0407 10:52:29.090409 139754138821696 params.py:248] model.dependency_relation.vocab_namespace = deprel_labels\n",
+      "I0407 10:52:29.090762 139754138821696 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n",
+      "I0407 10:52:29.090843 139754138821696 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n",
+      "I0407 10:52:29.090915 139754138821696 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n",
+      "I0407 10:52:29.091041 139754138821696 params.py:248] type = tanh\n",
+      "I0407 10:52:29.091149 139754138821696 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n",
+      "I0407 10:52:29.096003 139754138821696 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n",
+      "I0407 10:52:29.096106 139754138821696 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n",
+      "I0407 10:52:29.096185 139754138821696 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n",
+      "I0407 10:52:29.096311 139754138821696 params.py:248] type = tanh\n",
+      "I0407 10:52:29.096407 139754138821696 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n",
+      "I0407 10:52:29.101276 139754138821696 params.py:248] model.dependency_relation.head_predictor.cycle_loss_n = 0\n",
+      "I0407 10:52:29.101581 139754138821696 params.py:248] model.dependency_relation.head_projection_layer.in_features = 1024\n",
+      "I0407 10:52:29.101692 139754138821696 params.py:248] model.dependency_relation.head_projection_layer.out_features = 128\n",
+      "I0407 10:52:29.101771 139754138821696 params.py:248] model.dependency_relation.head_projection_layer.activation = tanh\n",
+      "I0407 10:52:29.101904 139754138821696 params.py:248] type = tanh\n",
+      "I0407 10:52:29.102032 139754138821696 params.py:248] model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n",
+      "I0407 10:52:29.103649 139754138821696 params.py:248] model.dependency_relation.dependency_projection_layer.in_features = 1024\n",
+      "I0407 10:52:29.103747 139754138821696 params.py:248] model.dependency_relation.dependency_projection_layer.out_features = 128\n",
+      "I0407 10:52:29.103819 139754138821696 params.py:248] model.dependency_relation.dependency_projection_layer.activation = tanh\n",
+      "I0407 10:52:29.103948 139754138821696 params.py:248] type = tanh\n",
+      "I0407 10:52:29.104044 139754138821696 params.py:248] model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n",
+      "I0407 10:52:29.105780 139754138821696 params.py:248] model.enhanced_dependency_relation = None\n",
+      "I0407 10:52:29.106371 139754138821696 params.py:248] model.regularizer.regexes.0.1.type = l2\n",
+      "I0407 10:52:29.106555 139754138821696 params.py:248] model.regularizer.regexes.0.1.alpha = 1e-06\n",
+      "I0407 10:52:29.106724 139754138821696 params.py:248] model.regularizer.regexes.1.1.type = l2\n",
+      "I0407 10:52:29.106879 139754138821696 params.py:248] model.regularizer.regexes.1.1.alpha = 1e-06\n",
+      "I0407 10:52:29.107035 139754138821696 params.py:248] model.regularizer.regexes.2.1.type = l2\n",
+      "I0407 10:52:29.107207 139754138821696 params.py:248] model.regularizer.regexes.2.1.alpha = 1e-06\n",
+      "I0407 10:52:29.107368 139754138821696 params.py:248] model.regularizer.regexes.3.1.type = l2\n",
+      "I0407 10:52:29.107544 139754138821696 params.py:248] model.regularizer.regexes.3.1.alpha = 1e-05\n",
+      "I0407 10:52:32.063793 139754138821696 archival.py:211] removing temporary unarchived model dir at /tmp/tmp2jhqu3i6\n",
+      "reading instances: 2205it [01:49, 20.15it/s]\n"
+     ]
+    }
+   ],
+   "source": [
+    "! {COMBO} --mode predict \\\n",
+    "    --cuda_device 0 \\\n",
+    "    --model_path model-pdbc/model.tar.gz \\\n",
+    "    --input_file connlu/pdbc-test.conllu \\\n",
+    "    --output_file connlu/pdbc-test-pred.conllu"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "13748ca1",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "# text = Mały chłopiec patrzy w bok po ściągnięciu okularów .\r\n",
+      "1\tMały\tmały\t_\t_\t_\t2\tadjunct\t2:adjunct\t_\r\n",
+      "2\tchłopiec\tchłopiec\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n",
+      "3\tpatrzy\tpatrzeć\t_\t_\t_\t0\troot\t0:root\t_\r\n",
+      "4\tw\tw\t_\t_\t_\t3\tadjunct_adl\t3:adjunct_adl\t_\r\n",
+      "5\tbok\tbok\t_\t_\t_\t4\tcomp\t4:comp\t_\r\n",
+      "6\tpo\tpo\t_\t_\t_\t3\tadjunct_temp\t3:adjunct_temp\t_\r\n",
+      "7\tściągnięciu\tściągnąć\t_\t_\t_\t6\tcomp\t6:comp\t_\r\n",
+      "8\tokularów\tokulary\t_\t_\t_\t7\tobj\t7:obj\t_\r\n",
+      "9\t.\t.\t_\t_\t_\t3\tpunct\t3:punct\t_\r\n"
+     ]
+    }
+   ],
+   "source": [
+    "! head connlu/pdbc-test.conllu"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "30021124",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "# text = Mały chłopiec patrzy w bok po ściągnięciu okularów .\r\n",
+      "1\tMały\tmały\t_\t_\t_\t2\tadjunct\t2:adjunct\t_\r\n",
+      "2\tchłopiec\tchłopiec\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n",
+      "3\tpatrzy\tpatrzeć\t_\t_\t_\t0\troot\t0:root\t_\r\n",
+      "4\tw\tw\t_\t_\t_\t3\tcomp\t3:adjunct_adl\t_\r\n",
+      "5\tbok\tbok\t_\t_\t_\t4\tcomp\t4:comp\t_\r\n",
+      "6\tpo\tpo\t_\t_\t_\t3\tadjunct_temp\t3:adjunct_temp\t_\r\n",
+      "7\tściągnięciu\tściągnąć\t_\t_\t_\t6\tcomp\t6:comp\t_\r\n",
+      "8\tokularów\tokulary\t_\t_\t_\t7\tobj\t7:obj\t_\r\n",
+      "9\t.\t.\t_\t_\t_\t3\tpunct\t3:punct\t_\r\n"
+     ]
+    }
+   ],
+   "source": [
+    "! head connlu/pdbc-test-pred.conllu"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "99359d8c",
+   "metadata": {},
+   "source": [
+    "Continuous-only model"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "30a66da6",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I0407 10:54:27.401382 140321380496448 archival.py:184] loading archive file model-pdbc-cont/model.tar.gz\n",
+      "I0407 10:54:27.402150 140321380496448 archival.py:263] extracting archive file model-pdbc-cont/model.tar.gz to temp dir /tmp/tmpuvesoi4q\n",
+      "I0407 10:54:43.091615 140321380496448 params.py:248] dataset_reader.type = conllu\n",
+      "I0407 10:54:43.092000 140321380496448 params.py:248] dataset_reader.lazy = False\n",
+      "I0407 10:54:43.092082 140321380496448 params.py:248] dataset_reader.cache_directory = None\n",
+      "I0407 10:54:43.092129 140321380496448 params.py:248] dataset_reader.max_instances = None\n",
+      "I0407 10:54:43.092173 140321380496448 params.py:248] dataset_reader.manual_distributed_sharding = False\n",
+      "I0407 10:54:43.092208 140321380496448 params.py:248] dataset_reader.manual_multi_process_sharding = False\n",
+      "I0407 10:54:43.092409 140321380496448 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n",
+      "I0407 10:54:43.092535 140321380496448 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n",
+      "I0407 10:54:43.092682 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:54:43.092730 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:54:43.092786 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:54:43.092888 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:54:43.092970 140321380496448 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n",
+      "I0407 10:54:43.093014 140321380496448 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n",
+      "I0407 10:54:43.093051 140321380496448 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n",
+      "I0407 10:54:43.093093 140321380496448 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:54:43.093198 140321380496448 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n",
+      "I0407 10:54:43.093306 140321380496448 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n",
+      "I0407 10:54:43.093353 140321380496448 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n",
+      "I0407 10:54:43.093388 140321380496448 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n",
+      "I0407 10:54:43.093482 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n",
+      "I0407 10:54:43.093593 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n",
+      "I0407 10:54:43.093723 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:54:43.093769 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:54:43.093816 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:54:43.093899 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:54:43.093993 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n",
+      "I0407 10:54:43.094043 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n",
+      "I0407 10:54:43.094079 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n",
+      "I0407 10:54:43.094121 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n",
+      "I0407 10:54:43.094226 140321380496448 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n",
+      "I0407 10:54:43.094377 140321380496448 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n",
+      "I0407 10:54:43.094430 140321380496448 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:54:43.094474 140321380496448 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n",
+      "I0407 10:54:43.094522 140321380496448 params.py:248] dataset_reader.token_indexers.token.max_length = None\n",
+      "I0407 10:54:43.094592 140321380496448 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:54:45.858621 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n",
+      "I0407 10:54:45.858990 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n",
+      "I0407 10:54:45.859087 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n",
+      "I0407 10:54:45.859157 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n",
+      "I0407 10:54:45.859210 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n",
+      "I0407 10:54:45.859268 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n",
+      "I0407 10:54:45.859321 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:54:45.859382 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n",
+      "I0407 10:54:45.859541 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n",
+      "I0407 10:54:45.859729 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n",
+      "I0407 10:54:45.859802 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n",
+      "I0407 10:54:45.859875 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n",
+      "I0407 10:54:45.859931 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n",
+      "I0407 10:54:45.859991 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n",
+      "I0407 10:54:45.860045 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:54:45.860103 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n",
+      "I0407 10:54:45.860332 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n",
+      "I0407 10:54:45.860523 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n",
+      "I0407 10:54:45.860739 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:54:45.860809 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:54:45.860888 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:54:45.861032 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:54:45.861149 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n",
+      "I0407 10:54:45.861213 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n",
+      "I0407 10:54:45.861277 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n",
+      "I0407 10:54:45.861337 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:54:45.861427 140321380496448 params.py:248] dataset_reader.features = ['token', 'char']\n",
+      "I0407 10:54:45.861522 140321380496448 params.py:248] dataset_reader.targets = ['head', 'deprel']\n",
+      "I0407 10:54:45.861611 140321380496448 params.py:248] dataset_reader.use_sem = False\n",
+      "I0407 10:54:45.861762 140321380496448 params.py:248] dataset_reader.type = conllu\n",
+      "I0407 10:54:45.862029 140321380496448 params.py:248] dataset_reader.lazy = False\n",
+      "I0407 10:54:45.862116 140321380496448 params.py:248] dataset_reader.cache_directory = None\n",
+      "I0407 10:54:45.862177 140321380496448 params.py:248] dataset_reader.max_instances = None\n",
+      "I0407 10:54:45.862234 140321380496448 params.py:248] dataset_reader.manual_distributed_sharding = False\n",
+      "I0407 10:54:45.862295 140321380496448 params.py:248] dataset_reader.manual_multi_process_sharding = False\n",
+      "I0407 10:54:45.862535 140321380496448 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n",
+      "I0407 10:54:45.862701 140321380496448 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n",
+      "I0407 10:54:45.862900 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:54:45.862966 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:54:45.863043 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:54:45.863168 140321380496448 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:54:45.863281 140321380496448 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n",
+      "I0407 10:54:45.863344 140321380496448 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n",
+      "I0407 10:54:45.863406 140321380496448 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n",
+      "I0407 10:54:45.863469 140321380496448 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:54:45.863596 140321380496448 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n",
+      "I0407 10:54:45.863752 140321380496448 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n",
+      "I0407 10:54:45.863821 140321380496448 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n",
+      "I0407 10:54:45.863883 140321380496448 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n",
+      "I0407 10:54:45.864030 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n",
+      "I0407 10:54:45.864196 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n",
+      "I0407 10:54:45.864392 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:54:45.864460 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:54:45.864540 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:54:45.864660 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:54:45.864772 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n",
+      "I0407 10:54:45.864835 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n",
+      "I0407 10:54:45.864896 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n",
+      "I0407 10:54:45.864965 140321380496448 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n",
+      "I0407 10:54:45.865104 140321380496448 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n",
+      "I0407 10:54:45.865323 140321380496448 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n",
+      "I0407 10:54:45.865396 140321380496448 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:54:45.865460 140321380496448 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n",
+      "I0407 10:54:45.865518 140321380496448 params.py:248] dataset_reader.token_indexers.token.max_length = None\n",
+      "I0407 10:54:45.865614 140321380496448 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:54:45.866884 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n",
+      "I0407 10:54:45.867116 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n",
+      "I0407 10:54:45.867190 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n",
+      "I0407 10:54:45.867258 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n",
+      "I0407 10:54:45.867316 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n",
+      "I0407 10:54:45.867376 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n",
+      "I0407 10:54:45.867437 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:54:45.867497 140321380496448 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n",
+      "I0407 10:54:45.867640 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n",
+      "I0407 10:54:45.867815 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n",
+      "I0407 10:54:45.867887 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n",
+      "I0407 10:54:45.867951 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n",
+      "I0407 10:54:45.868006 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n",
+      "I0407 10:54:45.868063 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n",
+      "I0407 10:54:45.868122 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:54:45.868181 140321380496448 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n",
+      "I0407 10:54:45.868388 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n",
+      "I0407 10:54:45.868559 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n",
+      "I0407 10:54:45.868757 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:54:45.868824 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:54:45.868897 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:54:45.869028 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:54:45.869139 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n",
+      "I0407 10:54:45.869202 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n",
+      "I0407 10:54:45.869256 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n",
+      "I0407 10:54:45.869315 140321380496448 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:54:45.869398 140321380496448 params.py:248] dataset_reader.features = ['token', 'char']\n",
+      "I0407 10:54:45.869489 140321380496448 params.py:248] dataset_reader.targets = ['head', 'deprel']\n",
+      "I0407 10:54:45.869572 140321380496448 params.py:248] dataset_reader.use_sem = False\n",
+      "I0407 10:54:45.870136 140321380496448 params.py:248] vocabulary.type = from_instances_extended\n",
+      "I0407 10:54:45.870218 140321380496448 vocabulary.py:323] Loading token dictionary from /tmp/tmpuvesoi4q/vocabulary.\n",
+      "I0407 10:54:45.870543 140321380496448 filelock.py:254] Lock 140317974842768 acquired on /tmp/tmpuvesoi4q/vocabulary/.lock\n",
+      "I0407 10:54:45.871132 140321380496448 filelock.py:317] Lock 140317974842768 released on /tmp/tmpuvesoi4q/vocabulary/.lock\n",
+      "I0407 10:54:45.871641 140321380496448 params.py:248] model.type = semantic_multitask\n",
+      "I0407 10:54:45.872183 140321380496448 params.py:248] model.text_field_embedder.type = basic\n",
+      "I0407 10:54:45.872548 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n",
+      "I0407 10:54:45.872749 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.embedding_dim = 64\n",
+      "I0407 10:54:45.873004 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n",
+      "I0407 10:54:45.873091 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n",
+      "I0407 10:54:45.873195 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n",
+      "I0407 10:54:45.873291 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n",
+      "I0407 10:54:45.873384 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n",
+      "I0407 10:54:45.873478 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n",
+      "I0407 10:54:45.873572 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n",
+      "I0407 10:54:45.873714 140321380496448 params.py:248] type = relu\n",
+      "I0407 10:54:45.873904 140321380496448 params.py:248] type = relu\n",
+      "I0407 10:54:45.874098 140321380496448 params.py:248] type = linear\n",
+      "I0407 10:54:45.880232 140321380496448 params.py:248] model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n",
+      "I0407 10:54:45.880783 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n",
+      "I0407 10:54:45.881011 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:54:45.881093 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.projection_dim = 100\n",
+      "I0407 10:54:45.881184 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f9e50745280>\n",
+      "I0407 10:54:45.881261 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n",
+      "I0407 10:54:45.881328 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.freeze_transformer = True\n",
+      "I0407 10:54:45.881389 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.last_layer_only = True\n",
+      "I0407 10:54:45.881492 140321380496448 params.py:384] model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:54:45.881562 140321380496448 params.py:248] model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I0407 10:54:52.911276 140321380496448 params.py:248] model.seq_encoder.type = combo_encoder\n",
+      "I0407 10:54:52.911743 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.input_size = 164\n",
+      "I0407 10:54:52.911836 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.hidden_size = 512\n",
+      "I0407 10:54:52.911902 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.num_layers = 2\n",
+      "I0407 10:54:52.911965 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n",
+      "I0407 10:54:52.912029 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n",
+      "I0407 10:54:52.912090 140321380496448 params.py:248] model.seq_encoder.stacked_bilstm.use_highway = False\n",
+      "I0407 10:54:53.279199 140321380496448 params.py:248] model.seq_encoder.layer_dropout_probability = 0.33\n",
+      "I0407 10:54:53.279505 140321380496448 params.py:248] model.use_sample_weight = True\n",
+      "I0407 10:54:53.279624 140321380496448 params.py:248] model.lemmatizer = None\n",
+      "I0407 10:54:53.279695 140321380496448 params.py:248] model.upos_tagger = None\n",
+      "I0407 10:54:53.279757 140321380496448 params.py:248] model.xpos_tagger = None\n",
+      "I0407 10:54:53.279815 140321380496448 params.py:248] model.semantic_relation = None\n",
+      "I0407 10:54:53.279873 140321380496448 params.py:248] model.morphological_feat = None\n",
+      "I0407 10:54:53.280155 140321380496448 params.py:248] model.dependency_relation.type = combo_dependency_parsing_from_vocab\n",
+      "I0407 10:54:53.280393 140321380496448 params.py:248] model.dependency_relation.vocab_namespace = deprel_labels\n",
+      "I0407 10:54:53.280741 140321380496448 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n",
+      "I0407 10:54:53.280819 140321380496448 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n",
+      "I0407 10:54:53.280887 140321380496448 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n",
+      "I0407 10:54:53.281012 140321380496448 params.py:248] type = tanh\n",
+      "I0407 10:54:53.281121 140321380496448 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n",
+      "I0407 10:54:53.285843 140321380496448 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n",
+      "I0407 10:54:53.286010 140321380496448 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n",
+      "I0407 10:54:53.286088 140321380496448 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n",
+      "I0407 10:54:53.286234 140321380496448 params.py:248] type = tanh\n",
+      "I0407 10:54:53.286334 140321380496448 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n",
+      "I0407 10:54:53.290788 140321380496448 params.py:248] model.dependency_relation.head_predictor.cycle_loss_n = 0\n",
+      "I0407 10:54:53.291093 140321380496448 params.py:248] model.dependency_relation.head_projection_layer.in_features = 1024\n",
+      "I0407 10:54:53.291184 140321380496448 params.py:248] model.dependency_relation.head_projection_layer.out_features = 128\n",
+      "I0407 10:54:53.291281 140321380496448 params.py:248] model.dependency_relation.head_projection_layer.activation = tanh\n",
+      "I0407 10:54:53.291444 140321380496448 params.py:248] type = tanh\n",
+      "I0407 10:54:53.291567 140321380496448 params.py:248] model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n",
+      "I0407 10:54:53.293048 140321380496448 params.py:248] model.dependency_relation.dependency_projection_layer.in_features = 1024\n",
+      "I0407 10:54:53.293147 140321380496448 params.py:248] model.dependency_relation.dependency_projection_layer.out_features = 128\n",
+      "I0407 10:54:53.293218 140321380496448 params.py:248] model.dependency_relation.dependency_projection_layer.activation = tanh\n",
+      "I0407 10:54:53.293342 140321380496448 params.py:248] type = tanh\n",
+      "I0407 10:54:53.293437 140321380496448 params.py:248] model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n",
+      "I0407 10:54:53.295091 140321380496448 params.py:248] model.enhanced_dependency_relation = None\n",
+      "I0407 10:54:53.295609 140321380496448 params.py:248] model.regularizer.regexes.0.1.type = l2\n",
+      "I0407 10:54:53.295784 140321380496448 params.py:248] model.regularizer.regexes.0.1.alpha = 1e-06\n",
+      "I0407 10:54:53.295953 140321380496448 params.py:248] model.regularizer.regexes.1.1.type = l2\n",
+      "I0407 10:54:53.296107 140321380496448 params.py:248] model.regularizer.regexes.1.1.alpha = 1e-06\n",
+      "I0407 10:54:53.296261 140321380496448 params.py:248] model.regularizer.regexes.2.1.type = l2\n",
+      "I0407 10:54:53.296412 140321380496448 params.py:248] model.regularizer.regexes.2.1.alpha = 1e-06\n",
+      "I0407 10:54:53.296564 140321380496448 params.py:248] model.regularizer.regexes.3.1.type = l2\n",
+      "I0407 10:54:53.296715 140321380496448 params.py:248] model.regularizer.regexes.3.1.alpha = 1e-05\n",
+      "I0407 10:54:56.194218 140321380496448 archival.py:211] removing temporary unarchived model dir at /tmp/tmpuvesoi4q\n",
+      "reading instances: 1980it [01:33, 21.15it/s]\n"
+     ]
+    }
+   ],
+   "source": [
+    "! {COMBO} --mode predict \\\n",
+    "    --cuda_device 0 \\\n",
+    "    --model_path model-pdbc-cont/model.tar.gz \\\n",
+    "    --input_file connlu/pdbc-cont-validation.conllu \\\n",
+    "    --output_file connlu/pdbc-cont-validation-pred.conllu"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "cfe7a3c4",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "# text = Dwie dziewczynki opierają się o dach kapliczki , chłopiec wspina się na niego , a trzecia dziewczynka stoi obok .\r\n",
+      "1\tDwie\tdwa\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n",
+      "2\tdziewczynki\tdziewczynka\t_\t_\t_\t1\tcomp\t1:comp\t_\r\n",
+      "3\topierają\topierać\t_\t_\t_\t15\tconjunct\t15:conjunct\t_\r\n",
+      "4\tsię\tsię\t_\t_\t_\t3\trefl\t3:refl\t_\r\n",
+      "5\to\to\t_\t_\t_\t3\tcomp\t3:comp\t_\r\n",
+      "6\tdach\tdach\t_\t_\t_\t5\tcomp\t5:comp\t_\r\n",
+      "7\tkapliczki\tkapliczka\t_\t_\t_\t6\tadjunct\t6:adjunct\t_\r\n",
+      "8\t,\t,\t_\t_\t_\t15\tpunct\t15:punct\t_\r\n",
+      "9\tchłopiec\tchłopiec\t_\t_\t_\t10\tsubj\t10:subj\t_\r\n"
+     ]
+    }
+   ],
+   "source": [
+    "! head connlu/pdbc-cont-validation.conllu"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "7dba9571",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "# text = Dwie dziewczynki opierają się o dach kapliczki , chłopiec wspina się na niego , a trzecia dziewczynka stoi obok .\r\n",
+      "1\tDwie\tdwa\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n",
+      "2\tdziewczynki\tdziewczynka\t_\t_\t_\t1\tcomp\t1:comp\t_\r\n",
+      "3\topierają\topierać\t_\t_\t_\t15\tconjunct\t15:conjunct\t_\r\n",
+      "4\tsię\tsię\t_\t_\t_\t3\trefl\t3:refl\t_\r\n",
+      "5\to\to\t_\t_\t_\t3\tcomp\t3:comp\t_\r\n",
+      "6\tdach\tdach\t_\t_\t_\t5\tcomp\t5:comp\t_\r\n",
+      "7\tkapliczki\tkapliczka\t_\t_\t_\t6\tadjunct\t6:adjunct\t_\r\n",
+      "8\t,\t,\t_\t_\t_\t15\tpunct\t15:punct\t_\r\n",
+      "9\tchłopiec\tchłopiec\t_\t_\t_\t10\tsubj\t10:subj\t_\r\n"
+     ]
+    }
+   ],
+   "source": [
+    "! head connlu/pdbc-cont-validation-pred.conllu"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "id": "679601c2",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I0407 10:56:35.295660 140254825452608 archival.py:184] loading archive file model-pdbc-cont/model.tar.gz\n",
+      "I0407 10:56:35.296370 140254825452608 archival.py:263] extracting archive file model-pdbc-cont/model.tar.gz to temp dir /tmp/tmpdhtf4et1\n",
+      "I0407 10:56:52.876630 140254825452608 params.py:248] dataset_reader.type = conllu\n",
+      "I0407 10:56:52.877122 140254825452608 params.py:248] dataset_reader.lazy = False\n",
+      "I0407 10:56:52.877243 140254825452608 params.py:248] dataset_reader.cache_directory = None\n",
+      "I0407 10:56:52.877313 140254825452608 params.py:248] dataset_reader.max_instances = None\n",
+      "I0407 10:56:52.877380 140254825452608 params.py:248] dataset_reader.manual_distributed_sharding = False\n",
+      "I0407 10:56:52.877446 140254825452608 params.py:248] dataset_reader.manual_multi_process_sharding = False\n",
+      "I0407 10:56:52.877737 140254825452608 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n",
+      "I0407 10:56:52.877938 140254825452608 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n",
+      "I0407 10:56:52.878201 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:56:52.878276 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:56:52.878360 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:56:52.878507 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:56:52.878633 140254825452608 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n",
+      "I0407 10:56:52.878702 140254825452608 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n",
+      "I0407 10:56:52.878761 140254825452608 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n",
+      "I0407 10:56:52.878825 140254825452608 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:56:52.878969 140254825452608 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n",
+      "I0407 10:56:52.879144 140254825452608 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n",
+      "I0407 10:56:52.879218 140254825452608 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n",
+      "I0407 10:56:52.879282 140254825452608 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n",
+      "I0407 10:56:52.879426 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n",
+      "I0407 10:56:52.879594 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n",
+      "I0407 10:56:52.879792 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:56:52.879862 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:56:52.879944 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:56:52.880068 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:56:52.880184 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n",
+      "I0407 10:56:52.880254 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n",
+      "I0407 10:56:52.880316 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n",
+      "I0407 10:56:52.880378 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n",
+      "I0407 10:56:52.880523 140254825452608 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n",
+      "I0407 10:56:52.880748 140254825452608 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n",
+      "I0407 10:56:52.880829 140254825452608 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:56:52.880893 140254825452608 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n",
+      "I0407 10:56:52.880957 140254825452608 params.py:248] dataset_reader.token_indexers.token.max_length = None\n",
+      "I0407 10:56:52.881069 140254825452608 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:56:55.893562 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n",
+      "I0407 10:56:55.894115 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n",
+      "I0407 10:56:55.894256 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n",
+      "I0407 10:56:55.894343 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n",
+      "I0407 10:56:55.894395 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n",
+      "I0407 10:56:55.894465 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n",
+      "I0407 10:56:55.894520 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:56:55.894590 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n",
+      "I0407 10:56:55.894762 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n",
+      "I0407 10:56:55.894958 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n",
+      "I0407 10:56:55.895048 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n",
+      "I0407 10:56:55.895111 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n",
+      "I0407 10:56:55.895176 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n",
+      "I0407 10:56:55.895228 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n",
+      "I0407 10:56:55.895297 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:56:55.895349 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n",
+      "I0407 10:56:55.895593 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n",
+      "I0407 10:56:55.895786 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n",
+      "I0407 10:56:55.896016 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:56:55.896095 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:56:55.896188 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:56:55.896353 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:56:55.896480 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n",
+      "I0407 10:56:55.896552 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n",
+      "I0407 10:56:55.896607 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n",
+      "I0407 10:56:55.896675 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:56:55.896760 140254825452608 params.py:248] dataset_reader.features = ['token', 'char']\n",
+      "I0407 10:56:55.896864 140254825452608 params.py:248] dataset_reader.targets = ['head', 'deprel']\n",
+      "I0407 10:56:55.896962 140254825452608 params.py:248] dataset_reader.use_sem = False\n",
+      "I0407 10:56:55.897153 140254825452608 params.py:248] dataset_reader.type = conllu\n",
+      "I0407 10:56:55.897414 140254825452608 params.py:248] dataset_reader.lazy = False\n",
+      "I0407 10:56:55.897499 140254825452608 params.py:248] dataset_reader.cache_directory = None\n",
+      "I0407 10:56:55.897570 140254825452608 params.py:248] dataset_reader.max_instances = None\n",
+      "I0407 10:56:55.897637 140254825452608 params.py:248] dataset_reader.manual_distributed_sharding = False\n",
+      "I0407 10:56:55.897707 140254825452608 params.py:248] dataset_reader.manual_multi_process_sharding = False\n",
+      "I0407 10:56:55.897995 140254825452608 params.py:248] dataset_reader.token_indexers.char.type = characters_const_padding\n",
+      "I0407 10:56:55.898183 140254825452608 params.py:248] dataset_reader.token_indexers.char.namespace = token_characters\n",
+      "I0407 10:56:55.898398 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:56:55.898473 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:56:55.898542 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:56:55.898677 140254825452608 params.py:248] dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:56:55.898799 140254825452608 params.py:248] dataset_reader.token_indexers.char.start_tokens = None\n",
+      "I0407 10:56:55.898869 140254825452608 params.py:248] dataset_reader.token_indexers.char.end_tokens = None\n",
+      "I0407 10:56:55.898936 140254825452608 params.py:248] dataset_reader.token_indexers.char.min_padding_length = 32\n",
+      "I0407 10:56:55.898998 140254825452608 params.py:248] dataset_reader.token_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:56:55.899158 140254825452608 params.py:248] dataset_reader.token_indexers.feats.type = feats_indexer\n",
+      "I0407 10:56:55.899337 140254825452608 params.py:248] dataset_reader.token_indexers.feats.namespace = feats\n",
+      "I0407 10:56:55.899414 140254825452608 params.py:248] dataset_reader.token_indexers.feats.feature_name = feats_\n",
+      "I0407 10:56:55.899485 140254825452608 params.py:248] dataset_reader.token_indexers.feats.token_min_padding_length = 0\n",
+      "I0407 10:56:55.899629 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.type = characters_const_padding\n",
+      "I0407 10:56:55.899797 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.namespace = token_characters\n",
+      "I0407 10:56:55.899995 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:56:55.900055 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:56:55.900130 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:56:55.900250 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:56:55.900363 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.start_tokens = None\n",
+      "I0407 10:56:55.900426 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.end_tokens = None\n",
+      "I0407 10:56:55.900486 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.min_padding_length = 32\n",
+      "I0407 10:56:55.900547 140254825452608 params.py:248] dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n",
+      "I0407 10:56:55.900689 140254825452608 params.py:248] dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n",
+      "I0407 10:56:55.900916 140254825452608 params.py:248] dataset_reader.token_indexers.token.token_min_padding_length = 0\n",
+      "I0407 10:56:55.900995 140254825452608 params.py:248] dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:56:55.901061 140254825452608 params.py:248] dataset_reader.token_indexers.token.namespace = tags\n",
+      "I0407 10:56:55.901125 140254825452608 params.py:248] dataset_reader.token_indexers.token.max_length = None\n",
+      "I0407 10:56:55.901226 140254825452608 params.py:384] dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:56:55.902561 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.type = single_id\n",
+      "I0407 10:56:55.902824 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.namespace = upostag\n",
+      "I0407 10:56:55.902909 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.lowercase_tokens = False\n",
+      "I0407 10:56:55.902969 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.start_tokens = None\n",
+      "I0407 10:56:55.903034 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.end_tokens = None\n",
+      "I0407 10:56:55.903095 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.feature_name = pos_\n",
+      "I0407 10:56:55.903159 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:56:55.903219 140254825452608 params.py:248] dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n",
+      "I0407 10:56:55.903364 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.type = single_id\n",
+      "I0407 10:56:55.903547 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.namespace = xpostag\n",
+      "I0407 10:56:55.903621 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n",
+      "I0407 10:56:55.903687 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.start_tokens = None\n",
+      "I0407 10:56:55.903748 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.end_tokens = None\n",
+      "I0407 10:56:55.903811 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.feature_name = tag_\n",
+      "I0407 10:56:55.903868 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "I0407 10:56:55.903931 140254825452608 params.py:248] dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n",
+      "I0407 10:56:55.904146 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.type = characters_const_padding\n",
+      "I0407 10:56:55.904325 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.namespace = lemma_characters\n",
+      "I0407 10:56:55.904539 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "I0407 10:56:55.904611 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "I0407 10:56:55.904691 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "I0407 10:56:55.904827 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "I0407 10:56:55.904946 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.start_tokens = None\n",
+      "I0407 10:56:55.905013 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.end_tokens = None\n",
+      "I0407 10:56:55.905084 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.min_padding_length = 32\n",
+      "I0407 10:56:55.905149 140254825452608 params.py:248] dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n",
+      "I0407 10:56:55.905237 140254825452608 params.py:248] dataset_reader.features = ['token', 'char']\n",
+      "I0407 10:56:55.905334 140254825452608 params.py:248] dataset_reader.targets = ['head', 'deprel']\n",
+      "I0407 10:56:55.905422 140254825452608 params.py:248] dataset_reader.use_sem = False\n",
+      "I0407 10:56:55.906047 140254825452608 params.py:248] vocabulary.type = from_instances_extended\n",
+      "I0407 10:56:55.906157 140254825452608 vocabulary.py:323] Loading token dictionary from /tmp/tmpdhtf4et1/vocabulary.\n",
+      "I0407 10:56:55.906635 140254825452608 filelock.py:254] Lock 140251419626896 acquired on /tmp/tmpdhtf4et1/vocabulary/.lock\n",
+      "I0407 10:56:55.907354 140254825452608 filelock.py:317] Lock 140251419626896 released on /tmp/tmpdhtf4et1/vocabulary/.lock\n",
+      "I0407 10:56:55.907914 140254825452608 params.py:248] model.type = semantic_multitask\n",
+      "I0407 10:56:55.908506 140254825452608 params.py:248] model.text_field_embedder.type = basic\n",
+      "I0407 10:56:55.908878 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n",
+      "I0407 10:56:55.909080 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.embedding_dim = 64\n",
+      "I0407 10:56:55.909353 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n",
+      "I0407 10:56:55.909446 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n",
+      "I0407 10:56:55.909554 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I0407 10:56:55.909654 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n",
+      "I0407 10:56:55.909750 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n",
+      "I0407 10:56:55.909847 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n",
+      "I0407 10:56:55.909946 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n",
+      "I0407 10:56:55.910176 140254825452608 params.py:248] type = relu\n",
+      "I0407 10:56:55.910410 140254825452608 params.py:248] type = relu\n",
+      "I0407 10:56:55.910567 140254825452608 params.py:248] type = linear\n",
+      "I0407 10:56:55.917278 140254825452608 params.py:248] model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n",
+      "I0407 10:56:55.917941 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n",
+      "I0407 10:56:55.918267 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n",
+      "I0407 10:56:55.918358 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.projection_dim = 100\n",
+      "I0407 10:56:55.918458 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f8ed1745280>\n",
+      "I0407 10:56:55.918541 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n",
+      "I0407 10:56:55.918609 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.freeze_transformer = True\n",
+      "I0407 10:56:55.918674 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.last_layer_only = True\n",
+      "I0407 10:56:55.918785 140254825452608 params.py:384] model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n",
+      "I0407 10:56:55.918858 140254825452608 params.py:248] model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n",
+      "I0407 10:57:03.624983 140254825452608 params.py:248] model.seq_encoder.type = combo_encoder\n",
+      "I0407 10:57:03.625626 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.input_size = 164\n",
+      "I0407 10:57:03.625742 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.hidden_size = 512\n",
+      "I0407 10:57:03.625796 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.num_layers = 2\n",
+      "I0407 10:57:03.625844 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n",
+      "I0407 10:57:03.625942 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n",
+      "I0407 10:57:03.626068 140254825452608 params.py:248] model.seq_encoder.stacked_bilstm.use_highway = False\n",
+      "I0407 10:57:03.933019 140254825452608 params.py:248] model.seq_encoder.layer_dropout_probability = 0.33\n",
+      "I0407 10:57:03.933302 140254825452608 params.py:248] model.use_sample_weight = True\n",
+      "I0407 10:57:03.933391 140254825452608 params.py:248] model.lemmatizer = None\n",
+      "I0407 10:57:03.933440 140254825452608 params.py:248] model.upos_tagger = None\n",
+      "I0407 10:57:03.933486 140254825452608 params.py:248] model.xpos_tagger = None\n",
+      "I0407 10:57:03.933528 140254825452608 params.py:248] model.semantic_relation = None\n",
+      "I0407 10:57:03.933570 140254825452608 params.py:248] model.morphological_feat = None\n",
+      "I0407 10:57:03.933835 140254825452608 params.py:248] model.dependency_relation.type = combo_dependency_parsing_from_vocab\n",
+      "I0407 10:57:03.934096 140254825452608 params.py:248] model.dependency_relation.vocab_namespace = deprel_labels\n",
+      "I0407 10:57:03.934389 140254825452608 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n",
+      "I0407 10:57:03.934459 140254825452608 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n",
+      "I0407 10:57:03.934515 140254825452608 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n",
+      "I0407 10:57:03.934614 140254825452608 params.py:248] type = tanh\n",
+      "I0407 10:57:03.934703 140254825452608 params.py:248] model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n",
+      "I0407 10:57:03.938141 140254825452608 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n",
+      "I0407 10:57:03.938247 140254825452608 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n",
+      "I0407 10:57:03.938306 140254825452608 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n",
+      "I0407 10:57:03.938404 140254825452608 params.py:248] type = tanh\n",
+      "I0407 10:57:03.938489 140254825452608 params.py:248] model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n",
+      "I0407 10:57:03.941669 140254825452608 params.py:248] model.dependency_relation.head_predictor.cycle_loss_n = 0\n",
+      "I0407 10:57:03.941908 140254825452608 params.py:248] model.dependency_relation.head_projection_layer.in_features = 1024\n",
+      "I0407 10:57:03.941985 140254825452608 params.py:248] model.dependency_relation.head_projection_layer.out_features = 128\n",
+      "I0407 10:57:03.942037 140254825452608 params.py:248] model.dependency_relation.head_projection_layer.activation = tanh\n",
+      "I0407 10:57:03.942123 140254825452608 params.py:248] type = tanh\n",
+      "I0407 10:57:03.942194 140254825452608 params.py:248] model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n",
+      "I0407 10:57:03.943288 140254825452608 params.py:248] model.dependency_relation.dependency_projection_layer.in_features = 1024\n",
+      "I0407 10:57:03.943376 140254825452608 params.py:248] model.dependency_relation.dependency_projection_layer.out_features = 128\n",
+      "I0407 10:57:03.943423 140254825452608 params.py:248] model.dependency_relation.dependency_projection_layer.activation = tanh\n",
+      "I0407 10:57:03.943510 140254825452608 params.py:248] type = tanh\n",
+      "I0407 10:57:03.943577 140254825452608 params.py:248] model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n",
+      "I0407 10:57:03.944838 140254825452608 params.py:248] model.enhanced_dependency_relation = None\n",
+      "I0407 10:57:03.945286 140254825452608 params.py:248] model.regularizer.regexes.0.1.type = l2\n",
+      "I0407 10:57:03.945443 140254825452608 params.py:248] model.regularizer.regexes.0.1.alpha = 1e-06\n",
+      "I0407 10:57:03.945568 140254825452608 params.py:248] model.regularizer.regexes.1.1.type = l2\n",
+      "I0407 10:57:03.945679 140254825452608 params.py:248] model.regularizer.regexes.1.1.alpha = 1e-06\n",
+      "I0407 10:57:03.945787 140254825452608 params.py:248] model.regularizer.regexes.2.1.type = l2\n",
+      "I0407 10:57:03.945892 140254825452608 params.py:248] model.regularizer.regexes.2.1.alpha = 1e-06\n",
+      "I0407 10:57:03.946047 140254825452608 params.py:248] model.regularizer.regexes.3.1.type = l2\n",
+      "I0407 10:57:03.946158 140254825452608 params.py:248] model.regularizer.regexes.3.1.alpha = 1e-05\n",
+      "I0407 10:57:06.549506 140254825452608 archival.py:211] removing temporary unarchived model dir at /tmp/tmpdhtf4et1\n",
+      "reading instances: 1990it [01:39, 20.00it/s]\n"
+     ]
+    }
+   ],
+   "source": [
+    "! {COMBO} --mode predict \\\n",
+    "    --cuda_device 0 \\\n",
+    "    --model_path model-pdbc-cont/model.tar.gz \\\n",
+    "    --input_file connlu/pdbc-cont-test.conllu \\\n",
+    "    --output_file connlu/pdbc-cont-test-pred.conllu"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "id": "ddc3986b",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "# text = Mały chłopiec patrzy w bok po ściągnięciu okularów .\r\n",
+      "1\tMały\tmały\t_\t_\t_\t2\tadjunct\t2:adjunct\t_\r\n",
+      "2\tchłopiec\tchłopiec\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n",
+      "3\tpatrzy\tpatrzeć\t_\t_\t_\t0\troot\t0:root\t_\r\n",
+      "4\tw\tw\t_\t_\t_\t3\tadjunct_adl\t3:adjunct_adl\t_\r\n",
+      "5\tbok\tbok\t_\t_\t_\t4\tcomp\t4:comp\t_\r\n",
+      "6\tpo\tpo\t_\t_\t_\t3\tadjunct_temp\t3:adjunct_temp\t_\r\n",
+      "7\tściągnięciu\tściągnąć\t_\t_\t_\t6\tcomp\t6:comp\t_\r\n",
+      "8\tokularów\tokulary\t_\t_\t_\t7\tobj\t7:obj\t_\r\n",
+      "9\t.\t.\t_\t_\t_\t3\tpunct\t3:punct\t_\r\n"
+     ]
+    }
+   ],
+   "source": [
+    "! head connlu/pdbc-cont-test.conllu"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "id": "34aa16d9",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "# text = Mały chłopiec patrzy w bok po ściągnięciu okularów .\r\n",
+      "1\tMały\tmały\t_\t_\t_\t2\tadjunct\t2:adjunct\t_\r\n",
+      "2\tchłopiec\tchłopiec\t_\t_\t_\t3\tsubj\t3:subj\t_\r\n",
+      "3\tpatrzy\tpatrzeć\t_\t_\t_\t0\troot\t0:root\t_\r\n",
+      "4\tw\tw\t_\t_\t_\t3\tcomp\t3:adjunct_adl\t_\r\n",
+      "5\tbok\tbok\t_\t_\t_\t4\tcomp\t4:comp\t_\r\n",
+      "6\tpo\tpo\t_\t_\t_\t3\tadjunct_temp\t3:adjunct_temp\t_\r\n",
+      "7\tściągnięciu\tściągnąć\t_\t_\t_\t6\tcomp\t6:comp\t_\r\n",
+      "8\tokularów\tokulary\t_\t_\t_\t7\tobj\t7:obj\t_\r\n",
+      "9\t.\t.\t_\t_\t_\t3\tpunct\t3:punct\t_\r\n"
+     ]
+    }
+   ],
+   "source": [
+    "! head connlu/pdbc-cont-test-pred.conllu"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "combo_python39",
+   "language": "python",
+   "name": "combo_python39"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.16"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git b/COMBO/TrainContModel.ipynb a/COMBO/TrainContModel.ipynb
new file mode 100644
index 0000000..8c58186
--- /dev/null
+++ a/COMBO/TrainContModel.ipynb
@@ -0,0 +1,14293 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "e613a4cf",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "COMBO = '/home/kkrasnowska/anaconda3/envs/combo_p39/bin/combo'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "e2563423",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I0406 22:49:10.502099 139680283460672 params.py:248] include_in_archive = None\n",
+      "2023-04-06 22:49:10,503 - INFO - allennlp.common.params - random_seed = 8787\n",
+      "2023-04-06 22:49:10,503 - INFO - allennlp.common.params - numpy_seed = 8787\n",
+      "2023-04-06 22:49:10,503 - INFO - allennlp.common.params - pytorch_seed = 8787\n",
+      "2023-04-06 22:49:10,504 - INFO - allennlp.common.checks - Pytorch version: 1.13.1\n",
+      "2023-04-06 22:49:10,505 - INFO - allennlp.common.params - type = default\n",
+      "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.type = conllu\n",
+      "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.lazy = False\n",
+      "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.cache_directory = None\n",
+      "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.max_instances = None\n",
+      "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.manual_distributed_sharding = False\n",
+      "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.manual_multi_process_sharding = False\n",
+      "2023-04-06 22:49:10,506 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.type = characters_const_padding\n",
+      "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.namespace = token_characters\n",
+      "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.start_tokens = None\n",
+      "2023-04-06 22:49:10,507 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.end_tokens = None\n",
+      "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.min_padding_length = 32\n",
+      "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.type = feats_indexer\n",
+      "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.namespace = feats\n",
+      "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.feature_name = feats_\n",
+      "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.type = characters_const_padding\n",
+      "2023-04-06 22:49:10,508 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.namespace = token_characters\n",
+      "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n",
+      "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n",
+      "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n",
+      "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n",
+      "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.start_tokens = None\n",
+      "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.end_tokens = None\n",
+      "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.min_padding_length = 32\n",
+      "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:10,509 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n",
+      "2023-04-06 22:49:10,510 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:10,510 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n",
+      "2023-04-06 22:49:10,510 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.namespace = tags\n",
+      "2023-04-06 22:49:10,510 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.max_length = None\n",
+      "2023-04-06 22:49:10,510 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n",
+      "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.type = single_id\n",
+      "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.namespace = upostag\n",
+      "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.lowercase_tokens = False\n",
+      "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.start_tokens = None\n",
+      "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.end_tokens = None\n",
+      "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.feature_name = pos_\n",
+      "2023-04-06 22:49:13,444 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.type = single_id\n",
+      "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.namespace = xpostag\n",
+      "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n",
+      "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.start_tokens = None\n",
+      "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.end_tokens = None\n",
+      "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.feature_name = tag_\n",
+      "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "2023-04-06 22:49:13,445 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.type = characters_const_padding\n",
+      "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.namespace = lemma_characters\n",
+      "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "2023-04-06 22:49:13,446 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.start_tokens = None\n",
+      "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.end_tokens = None\n",
+      "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.min_padding_length = 32\n",
+      "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.features = ['token', 'char']\n",
+      "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.targets = ['head', 'deprel']\n",
+      "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - dataset_reader.use_sem = False\n",
+      "2023-04-06 22:49:13,447 - INFO - allennlp.common.params - train_data_path = connlu/pdbc-cont-train.conllu\n",
+      "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - datasets_for_vocab_creation = ['train']\n",
+      "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - validation_dataset_reader = None\n",
+      "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - validation_data_path = connlu/pdbc-cont-validation.conllu\n",
+      "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - validation_data_loader = None\n",
+      "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - test_data_path = None\n",
+      "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - evaluate_on_test = False\n",
+      "2023-04-06 22:49:13,448 - INFO - allennlp.common.params - batch_weight_key = \n",
+      "2023-04-06 22:49:13,448 - INFO - allennlp.training.util - Reading training data from connlu/pdbc-cont-train.conllu\n",
+      "reading instances: 0it [00:00, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "reading instances: 3878it [00:02, 1938.62it/s]\n",
+      "reading instances: 8280it [00:04, 2010.38it/s]\n",
+      "reading instances: 11587it [00:06, 1750.85it/s]\n",
+      "reading instances: 15202it [00:08, 1679.50it/s]\n",
+      "reading instances: 15903it [00:09, 1757.51it/s]\n",
+      "2023-04-06 22:49:22,498 - INFO - allennlp.training.util - Reading validation data from connlu/pdbc-cont-validation.conllu\n",
+      "reading instances: 0it [00:00, ?it/s]\n",
+      "reading instances: 1980it [00:00, 3415.26it/s]\n",
+      "2023-04-06 22:49:23,078 - INFO - allennlp.commands.train - From dataset instances, train will be considered for vocabulary creation.\n",
+      "2023-04-06 22:49:23,078 - INFO - allennlp.common.params - vocabulary.type = from_instances_extended\n",
+      "2023-04-06 22:49:23,078 - INFO - allennlp.common.params - vocabulary.min_count = None\n",
+      "2023-04-06 22:49:23,078 - INFO - allennlp.common.params - vocabulary.max_vocab_size = None\n",
+      "2023-04-06 22:49:23,078 - INFO - allennlp.common.params - vocabulary.non_padded_namespaces = ['head_labels']\n",
+      "2023-04-06 22:49:23,079 - INFO - allennlp.common.params - vocabulary.pretrained_files = None\n",
+      "2023-04-06 22:49:23,079 - INFO - allennlp.common.params - vocabulary.only_include_pretrained_words = True\n",
+      "2023-04-06 22:49:23,079 - INFO - allennlp.common.params - vocabulary.min_pretrained_embeddings = None\n",
+      "2023-04-06 22:49:23,079 - INFO - allennlp.common.params - vocabulary.padding_token = __PAD__\n",
+      "2023-04-06 22:49:23,079 - INFO - allennlp.common.params - vocabulary.oov_token = _\n",
+      "2023-04-06 22:49:23,079 - INFO - allennlp.data.vocabulary - Fitting token dictionary from dataset.\n",
+      "building vocab: 0it [00:00, ?it/s]\n",
+      "building vocab: 15903it [00:01, 10066.76it/s]\n",
+      "2023-04-06 22:49:24,659 - INFO - allennlp.common.params - model.type = semantic_multitask\n",
+      "2023-04-06 22:49:24,660 - INFO - allennlp.common.params - model.text_field_embedder.type = basic\n",
+      "2023-04-06 22:49:24,660 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n",
+      "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.embedding_dim = 64\n",
+      "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n",
+      "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n",
+      "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n",
+      "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n",
+      "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n",
+      "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n",
+      "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n",
+      "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - type = relu\n",
+      "2023-04-06 22:49:24,661 - INFO - allennlp.common.params - type = relu\n",
+      "2023-04-06 22:49:24,662 - INFO - allennlp.common.params - type = linear\n",
+      "2023-04-06 22:49:24,666 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n",
+      "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n",
+      "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n",
+      "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_dim = 100\n",
+      "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f090c144280>\n",
+      "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n",
+      "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.freeze_transformer = True\n",
+      "2023-04-06 22:49:24,667 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.last_layer_only = True\n",
+      "2023-04-06 22:49:24,668 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n",
+      "2023-04-06 22:49:24,668 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n",
+      "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.type = combo_encoder\n",
+      "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.input_size = 164\n",
+      "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.hidden_size = 512\n",
+      "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.num_layers = 2\n",
+      "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n",
+      "2023-04-06 22:49:33,577 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n",
+      "2023-04-06 22:49:33,578 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.use_highway = False\n",
+      "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.seq_encoder.layer_dropout_probability = 0.33\n",
+      "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.use_sample_weight = True\n",
+      "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.lemmatizer = None\n",
+      "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.upos_tagger = None\n",
+      "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.xpos_tagger = None\n",
+      "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.semantic_relation = None\n",
+      "2023-04-06 22:49:34,201 - INFO - allennlp.common.params - model.morphological_feat = None\n",
+      "2023-04-06 22:49:34,202 - INFO - allennlp.common.params - model.dependency_relation.type = combo_dependency_parsing_from_vocab\n",
+      "2023-04-06 22:49:34,202 - INFO - allennlp.common.params - model.dependency_relation.vocab_namespace = deprel_labels\n",
+      "2023-04-06 22:49:34,202 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n",
+      "2023-04-06 22:49:34,203 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n",
+      "2023-04-06 22:49:34,203 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n",
+      "2023-04-06 22:49:34,203 - INFO - allennlp.common.params - type = tanh\n",
+      "2023-04-06 22:49:34,203 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n",
+      "2023-04-06 22:49:34,207 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n",
+      "2023-04-06 22:49:34,208 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n",
+      "2023-04-06 22:49:34,208 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n",
+      "2023-04-06 22:49:34,208 - INFO - allennlp.common.params - type = tanh\n",
+      "2023-04-06 22:49:34,208 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n",
+      "2023-04-06 22:49:34,212 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.cycle_loss_n = 0\n",
+      "2023-04-06 22:49:34,213 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.in_features = 1024\n",
+      "2023-04-06 22:49:34,213 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.out_features = 128\n",
+      "2023-04-06 22:49:34,213 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.activation = tanh\n",
+      "2023-04-06 22:49:34,213 - INFO - allennlp.common.params - type = tanh\n",
+      "2023-04-06 22:49:34,213 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n",
+      "2023-04-06 22:49:34,215 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.in_features = 1024\n",
+      "2023-04-06 22:49:34,215 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.out_features = 128\n",
+      "2023-04-06 22:49:34,215 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.activation = tanh\n",
+      "2023-04-06 22:49:34,215 - INFO - allennlp.common.params - type = tanh\n",
+      "2023-04-06 22:49:34,215 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n",
+      "2023-04-06 22:49:34,217 - INFO - allennlp.common.params - model.enhanced_dependency_relation = None\n",
+      "2023-04-06 22:49:34,217 - INFO - allennlp.common.params - model.regularizer.regexes.0.1.type = l2\n",
+      "2023-04-06 22:49:34,217 - INFO - allennlp.common.params - model.regularizer.regexes.0.1.alpha = 1e-06\n",
+      "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.1.1.type = l2\n",
+      "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.1.1.alpha = 1e-06\n",
+      "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.2.1.type = l2\n",
+      "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.2.1.alpha = 1e-06\n",
+      "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.3.1.type = l2\n",
+      "2023-04-06 22:49:34,218 - INFO - allennlp.common.params - model.regularizer.regexes.3.1.alpha = 1e-05\n",
+      "2023-04-06 22:49:34,219 - INFO - filelock - Lock 139674732932928 acquired on ./allennlp867qpopk/vocabulary/.lock\n",
+      "2023-04-06 22:49:34,220 - INFO - filelock - Lock 139674732932928 released on ./allennlp867qpopk/vocabulary/.lock\n",
+      "2023-04-06 22:49:34,220 - INFO - allennlp.common.params - data_loader.type = pytorch_dataloader\n",
+      "2023-04-06 22:49:34,220 - INFO - allennlp.common.params - data_loader.batch_size = 1\n",
+      "2023-04-06 22:49:34,220 - INFO - allennlp.common.params - data_loader.shuffle = False\n",
+      "2023-04-06 22:49:34,220 - INFO - allennlp.common.params - data_loader.sampler = None\n",
+      "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.num_workers = 0\n",
+      "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.pin_memory = False\n",
+      "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.drop_last = False\n",
+      "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.timeout = 0\n",
+      "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.worker_init_fn = None\n",
+      "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.multiprocessing_context = None\n",
+      "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.batches_per_epoch = None\n",
+      "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.batch_sampler.type = token_count\n",
+      "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.batch_sampler.word_batch_size = 2500\n",
+      "2023-04-06 22:49:34,221 - INFO - allennlp.common.params - data_loader.batch_sampler.shuffle_dataset = True\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "/home/kkrasnowska/anaconda3/envs/combo_p39/lib/python3.8/site-packages/combo/data/samplers/samplers.py:51: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n",
+      "  self.batch_dataset = np.array(self.batch_dataset)[indices].tolist()\n",
+      "2023-04-06 22:49:34,240 - INFO - allennlp.common.params - data_loader.type = pytorch_dataloader\n",
+      "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.batch_size = 1\n",
+      "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.shuffle = False\n",
+      "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.sampler = None\n",
+      "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.num_workers = 0\n",
+      "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.pin_memory = False\n",
+      "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.drop_last = False\n",
+      "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.timeout = 0\n",
+      "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.worker_init_fn = None\n",
+      "2023-04-06 22:49:34,241 - INFO - allennlp.common.params - data_loader.multiprocessing_context = None\n",
+      "2023-04-06 22:49:34,242 - INFO - allennlp.common.params - data_loader.batches_per_epoch = None\n",
+      "2023-04-06 22:49:34,242 - INFO - allennlp.common.params - data_loader.batch_sampler.type = token_count\n",
+      "2023-04-06 22:49:34,242 - INFO - allennlp.common.params - data_loader.batch_sampler.word_batch_size = 2500\n",
+      "2023-04-06 22:49:34,242 - INFO - allennlp.common.params - data_loader.batch_sampler.shuffle_dataset = True\n",
+      "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.type = gradient_descent_validate_n\n",
+      "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.patience = 1\n",
+      "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.validation_metric = +EM\n",
+      "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.num_epochs = 400\n",
+      "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.cuda_device = 0\n",
+      "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.grad_norm = None\n",
+      "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.grad_clipping = 5\n",
+      "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.distributed = None\n",
+      "2023-04-06 22:49:34,245 - INFO - allennlp.common.params - trainer.world_size = 1\n",
+      "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.num_gradient_accumulation_steps = 1\n",
+      "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.use_amp = False\n",
+      "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.no_grad = None\n",
+      "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.momentum_scheduler = None\n",
+      "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.tensorboard_writer = None\n",
+      "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.moving_average = None\n",
+      "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.batch_callbacks = None\n",
+      "2023-04-06 22:49:34,246 - INFO - allennlp.common.params - trainer.epoch_callbacks.0.type = transfer_patience\n",
+      "2023-04-06 22:49:34,247 - INFO - allennlp.common.params - trainer.end_callbacks = None\n",
+      "2023-04-06 22:49:34,247 - INFO - allennlp.common.params - trainer.trainer_callbacks = None\n",
+      "2023-04-06 22:49:36,168 - INFO - allennlp.common.params - trainer.optimizer.type = adam\n",
+      "2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.parameter_groups = None\n",
+      "2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.lr = 0.002\n",
+      "2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.betas = [0.9, 0.9]\n",
+      "2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.eps = 1e-08\n",
+      "2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.weight_decay = 0.0\n",
+      "2023-04-06 22:49:36,169 - INFO - allennlp.common.params - trainer.optimizer.amsgrad = False\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.training.optimizers - Number of trainable parameters: 11053808\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - The following parameters are Frozen (without gradient):\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.word_embeddings.weight\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.position_embeddings.weight\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.token_type_embeddings.weight\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,170 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.dense.weight\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.dense.bias\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,171 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.dense.weight\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.dense.bias\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,172 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.dense.weight\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.dense.bias\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,173 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.dense.weight\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.dense.bias\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,174 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.dense.weight\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.dense.bias\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,175 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.dense.weight\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.dense.bias\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,176 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.dense.weight\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.dense.bias\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.dense.weight\n",
+      "2023-04-06 22:49:36,177 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.dense.bias\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.dense.weight\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.dense.bias\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,178 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.dense.weight\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.dense.bias\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,179 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.dense.weight\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.dense.bias\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,180 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.dense.weight\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.dense.bias\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,181 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.dense.weight\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.dense.bias\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,182 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.dense.weight\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.dense.bias\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,183 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.dense.weight\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.dense.bias\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,184 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.dense.weight\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.dense.bias\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,185 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.dense.weight\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.dense.bias\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,186 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.dense.weight\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.dense.bias\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,187 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.dense.weight\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.dense.bias\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.dense.weight\n",
+      "2023-04-06 22:49:36,188 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.dense.bias\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.value.bias\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.dense.weight\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.dense.bias\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.intermediate.dense.weight\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.intermediate.dense.bias\n",
+      "2023-04-06 22:49:36,189 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.dense.weight\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.dense.bias\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.LayerNorm.weight\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.LayerNorm.bias\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.query.weight\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.query.bias\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.key.weight\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.key.bias\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.value.weight\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.value.bias\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.dense.weight\r\n",
+      "2023-04-06 22:49:36,190 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.dense.bias\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.dense.weight\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.dense.bias\r\n",
+      "2023-04-06 22:49:36,191 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.dense.weight\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.dense.bias\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:36,192 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.pooler.dense.weight\r\n",
+      "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.pooler.dense.bias\r\n",
+      "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - The following parameters are Tunable (with gradient):\r\n",
+      "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - _head_sentinel\r\n",
+      "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.char_embed.weight\r\n",
+      "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.0.weight\r\n",
+      "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.0.bias\r\n",
+      "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.1.weight\r\n",
+      "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.1.bias\r\n",
+      "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.2.weight\r\n",
+      "2023-04-06 22:49:36,193 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.2.bias\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token.projection_layer.weight\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token.projection_layer.bias\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.input_linearity.weight\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.state_linearity.weight\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.state_linearity.bias\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.input_linearity.weight\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.state_linearity.weight\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.state_linearity.bias\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.input_linearity.weight\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.state_linearity.weight\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.state_linearity.bias\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.input_linearity.weight\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.state_linearity.weight\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.state_linearity.bias\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - dependency_relation.head_predictor.head_projection_layer.weight\r\n",
+      "2023-04-06 22:49:36,195 - INFO - allennlp.common.util - dependency_relation.head_predictor.head_projection_layer.bias\r\n",
+      "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.head_predictor.dependency_projection_layer.weight\r\n",
+      "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.head_predictor.dependency_projection_layer.bias\r\n",
+      "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.head_projection_layer.weight\r\n",
+      "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.head_projection_layer.bias\r\n",
+      "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.dependency_projection_layer.weight\r\n",
+      "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.dependency_projection_layer.bias\r\n",
+      "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.relation_prediction_layer.weight\r\n",
+      "2023-04-06 22:49:36,196 - INFO - allennlp.common.util - dependency_relation.relation_prediction_layer.bias\r\n",
+      "2023-04-06 22:49:36,196 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.type = combo_scheduler\r\n",
+      "2023-04-06 22:49:36,196 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.patience = 6\r\n",
+      "2023-04-06 22:49:36,196 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.decreases = 2\r\n",
+      "2023-04-06 22:49:36,197 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.threshold = 0.001\r\n",
+      "2023-04-06 22:49:36,197 - INFO - allennlp.common.params - trainer.checkpointer.type = finishing_only_checkpointer\r\n",
+      "2023-04-06 22:49:36,197 - INFO - allennlp.common.params - trainer.checkpointer.keep_serialized_model_every_num_seconds = None\r\n",
+      "2023-04-06 22:49:36,197 - INFO - allennlp.common.params - trainer.checkpointer.num_serialized_models_to_keep = 2\r\n",
+      "2023-04-06 22:49:36,197 - INFO - allennlp.common.params - trainer.checkpointer.model_save_interval = None\r\n",
+      "2023-04-06 22:49:36,199 - INFO - combo.training.trainer - Beginning training.\r\n",
+      "2023-04-06 22:49:36,199 - INFO - allennlp.training.trainer - Epoch 0/399\r\n",
+      "2023-04-06 22:49:36,199 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.3G\r\n",
+      "2023-04-06 22:49:36,199 - INFO - allennlp.training.trainer - GPU 0 memory usage: 1.4G\r\n",
+      "2023-04-06 22:49:36,206 - INFO - allennlp.training.trainer - Training\r\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\r\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0004, UAS: 0.0545, LAS: 0.0004, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.5812, partial_loss/deprel_loss: 12.1384, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5281, loss: 11.5281, batch_reg_loss: 0.1011, reg_loss: 0.1011 ||:   1%|1         | 1/95 [00:02<03:22,  2.15s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0000, UAS: 0.0534, LAS: 0.0025, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 54.5014, partial_loss/deprel_loss: 9.3042, partial_loss/cycle_loss: 0.0000, batch_loss: 18.4440, loss: 29.0149, batch_reg_loss: 0.1003, reg_loss: 0.1007 ||:   5%|5         | 5/95 [00:04<02:32,  1.69s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0048, UAS: 0.0484, LAS: 0.0043, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 26.8907, partial_loss/deprel_loss: 10.2825, partial_loss/cycle_loss: 0.0000, batch_loss: 13.7041, loss: 28.1204, batch_reg_loss: 0.1000, reg_loss: 0.1004 ||:   9%|9         | 9/95 [00:06<01:56,  1.35s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0075, UAS: 0.0514, LAS: 0.0053, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 16.4258, partial_loss/deprel_loss: 8.9739, partial_loss/cycle_loss: 0.0000, batch_loss: 10.5639, loss: 24.1295, batch_reg_loss: 0.0996, reg_loss: 0.1003 ||:  13%|#2        | 12/95 [00:08<01:35,  1.15s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0248, UAS: 0.0550, LAS: 0.0072, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 30.6838, partial_loss/deprel_loss: 6.7519, partial_loss/cycle_loss: 0.0000, batch_loss: 11.6376, loss: 21.7925, batch_reg_loss: 0.0993, reg_loss: 0.1001 ||:  16%|#5        | 15/95 [00:10<01:20,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0128, UAS: 0.0582, LAS: 0.0085, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 12.5911, partial_loss/deprel_loss: 8.4106, partial_loss/cycle_loss: 0.0000, batch_loss: 9.3455, loss: 19.5927, batch_reg_loss: 0.0988, reg_loss: 0.0999 ||:  20%|##        | 19/95 [00:13<01:08,  1.11it/s] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0032, UAS: 0.0579, LAS: 0.0088, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 18.6420, partial_loss/deprel_loss: 11.9442, partial_loss/cycle_loss: 0.0000, batch_loss: 13.3822, loss: 18.3815, batch_reg_loss: 0.0984, reg_loss: 0.0997 ||:  23%|##3       | 22/95 [00:15<01:01,  1.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0279, UAS: 0.0718, LAS: 0.0148, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 11.8369, partial_loss/deprel_loss: 6.2066, partial_loss/cycle_loss: 0.0000, batch_loss: 7.4307, loss: 17.0702, batch_reg_loss: 0.0980, reg_loss: 0.0995 ||:  26%|##6       | 25/95 [00:18<00:59,  1.17it/s]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0260, UAS: 0.0776, LAS: 0.0161, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.1379, partial_loss/deprel_loss: 6.0939, partial_loss/cycle_loss: 0.0000, batch_loss: 6.4003, loss: 16.0644, batch_reg_loss: 0.0976, reg_loss: 0.0993 ||:  29%|##9       | 28/95 [00:22<01:07,  1.01s/it] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0340, UAS: 0.0781, LAS: 0.0163, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.3717, partial_loss/deprel_loss: 6.7100, partial_loss/cycle_loss: 0.0000, batch_loss: 7.1393, loss: 15.1670, batch_reg_loss: 0.0969, reg_loss: 0.0990 ||:  34%|###3      | 32/95 [00:24<00:56,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0187, UAS: 0.0777, LAS: 0.0165, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.8800, partial_loss/deprel_loss: 8.6119, partial_loss/cycle_loss: 0.0000, batch_loss: 9.1620, loss: 14.6762, batch_reg_loss: 0.0964, reg_loss: 0.0988 ||:  37%|###6      | 35/95 [00:27<00:51,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0104, UAS: 0.0764, LAS: 0.0161, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 13.7758, partial_loss/deprel_loss: 10.7456, partial_loss/cycle_loss: 0.0000, batch_loss: 11.4476, loss: 14.4105, batch_reg_loss: 0.0959, reg_loss: 0.0986 ||:  40%|####      | 38/95 [00:29<00:46,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0211, UAS: 0.0791, LAS: 0.0156, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.5813, partial_loss/deprel_loss: 7.7125, partial_loss/cycle_loss: 0.0000, batch_loss: 7.7814, loss: 13.8527, batch_reg_loss: 0.0952, reg_loss: 0.0983 ||:  44%|####4     | 42/95 [00:31<00:40,  1.31it/s]   \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0355, UAS: 0.0847, LAS: 0.0172, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5881, partial_loss/deprel_loss: 5.1220, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1099, loss: 13.3031, batch_reg_loss: 0.0947, reg_loss: 0.0981 ||:  47%|####7     | 45/95 [00:34<00:39,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0147, UAS: 0.0887, LAS: 0.0176, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.7138, partial_loss/deprel_loss: 9.5235, partial_loss/cycle_loss: 0.0000, batch_loss: 9.6557, loss: 12.9664, batch_reg_loss: 0.0941, reg_loss: 0.0978 ||:  51%|#####     | 48/95 [00:36<00:35,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0279, UAS: 0.0896, LAS: 0.0176, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.1660, partial_loss/deprel_loss: 7.7062, partial_loss/cycle_loss: 0.0000, batch_loss: 7.6917, loss: 12.7503, batch_reg_loss: 0.0935, reg_loss: 0.0976 ||:  54%|#####3    | 51/95 [00:38<00:32,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0475, UAS: 0.0943, LAS: 0.0184, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.6122, partial_loss/deprel_loss: 5.5939, partial_loss/cycle_loss: 0.0000, batch_loss: 5.4905, loss: 12.4588, batch_reg_loss: 0.0929, reg_loss: 0.0974 ||:  57%|#####6    | 54/95 [00:40<00:30,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0095, UAS: 0.0959, LAS: 0.0184, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.1111, partial_loss/deprel_loss: 9.9458, partial_loss/cycle_loss: 0.0000, batch_loss: 10.0712, loss: 12.2757, batch_reg_loss: 0.0923, reg_loss: 0.0971 ||:  60%|######    | 57/95 [00:43<00:29,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0295, UAS: 0.1010, LAS: 0.0194, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.3592, partial_loss/deprel_loss: 8.1111, partial_loss/cycle_loss: 0.0000, batch_loss: 8.0525, loss: 12.0223, batch_reg_loss: 0.0918, reg_loss: 0.0968 ||:  63%|######3   | 60/95 [00:45<00:27,  1.29it/s]  \n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0211, UAS: 0.1046, LAS: 0.0201, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 12.1219, partial_loss/deprel_loss: 10.9192, partial_loss/cycle_loss: 0.0000, batch_loss: 11.2509, loss: 11.8418, batch_reg_loss: 0.0912, reg_loss: 0.0966 ||:  66%|######6   | 63/95 [00:48<00:24,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0635, UAS: 0.1096, LAS: 0.0216, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5291, partial_loss/deprel_loss: 5.6521, partial_loss/cycle_loss: 0.0000, batch_loss: 5.5181, loss: 11.5928, batch_reg_loss: 0.0906, reg_loss: 0.0963 ||:  69%|######9   | 66/95 [00:50<00:22,  1.32it/s]   \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0398, UAS: 0.1150, LAS: 0.0234, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.7731, partial_loss/deprel_loss: 9.1982, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4030, loss: 11.3990, batch_reg_loss: 0.0898, reg_loss: 0.0960 ||:  74%|#######3  | 70/95 [00:52<00:18,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0846, UAS: 0.1186, LAS: 0.0248, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.3256, partial_loss/deprel_loss: 6.6774, partial_loss/cycle_loss: 0.0000, batch_loss: 6.6964, loss: 11.2984, batch_reg_loss: 0.0893, reg_loss: 0.0957 ||:  77%|#######6  | 73/95 [00:55<00:16,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0833, UAS: 0.1243, LAS: 0.0270, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.0066, partial_loss/deprel_loss: 6.5017, partial_loss/cycle_loss: 0.0000, batch_loss: 6.4915, loss: 11.1237, batch_reg_loss: 0.0888, reg_loss: 0.0954 ||:  80%|########  | 76/95 [00:57<00:15,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0703, UAS: 0.1299, LAS: 0.0293, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.8032, partial_loss/deprel_loss: 7.2562, partial_loss/cycle_loss: 0.0000, batch_loss: 7.2538, loss: 10.9525, batch_reg_loss: 0.0882, reg_loss: 0.0951 ||:  84%|########4 | 80/95 [01:00<00:11,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1558, UAS: 0.1366, LAS: 0.0323, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8053, partial_loss/deprel_loss: 4.8429, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7231, loss: 10.7869, batch_reg_loss: 0.0878, reg_loss: 0.0948 ||:  87%|########7 | 83/95 [01:02<00:09,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0715, UAS: 0.1407, LAS: 0.0338, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.0259, partial_loss/deprel_loss: 7.7293, partial_loss/cycle_loss: 0.0000, batch_loss: 7.6759, loss: 10.6741, batch_reg_loss: 0.0873, reg_loss: 0.0946 ||:  91%|######### | 86/95 [01:05<00:06,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2157, UAS: 0.1479, LAS: 0.0369, UEM: 0.0003, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3231, partial_loss/deprel_loss: 3.5750, partial_loss/cycle_loss: 0.0000, batch_loss: 3.4113, loss: 10.5203, batch_reg_loss: 0.0867, reg_loss: 0.0942 ||:  95%|#########4| 90/95 [01:07<00:03,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1474, UAS: 0.1547, LAS: 0.0400, UEM: 0.0003, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.0826, partial_loss/deprel_loss: 5.3748, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2025, loss: 10.3609, batch_reg_loss: 0.0862, reg_loss: 0.0939 ||:  99%|#########8| 94/95 [01:10<00:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0841, UAS: 0.1557, LAS: 0.0404, UEM: 0.0003, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.5016, partial_loss/deprel_loss: 7.9801, partial_loss/cycle_loss: 0.0000, batch_loss: 7.9705, loss: 10.3357, batch_reg_loss: 0.0860, reg_loss: 0.0938 ||: 100%|##########| 95/95 [01:11<00:00,  1.33it/s]\n",
+      "2023-04-06 22:50:47,786 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0548, UAS: 0.2285, LAS: 0.0729, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.1434, partial_loss/deprel_loss: 20.6559, partial_loss/cycle_loss: 0.0000, batch_loss: 18.5534, loss: 17.4393, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:12,  1.35s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2127, UAS: 0.3238, LAS: 0.1315, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.1571, partial_loss/deprel_loss: 10.7516, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4327, loss: 13.8287, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  36%|###6      | 4/11 [00:04<00:08,  1.25s/it]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1265, UAS: 0.3078, LAS: 0.1205, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.1798, partial_loss/deprel_loss: 12.8523, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5178, loss: 14.0520, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  55%|#####4    | 6/11 [00:06<00:05,  1.20s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2520, UAS: 0.3285, LAS: 0.1346, UEM: 0.0024, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5845, partial_loss/deprel_loss: 9.4003, partial_loss/cycle_loss: 0.0000, batch_loss: 8.2371, loss: 13.1916, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:09<00:03,  1.18s/it]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1437, UAS: 0.3256, LAS: 0.1316, UEM: 0.0020, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.5130, partial_loss/deprel_loss: 13.1310, partial_loss/cycle_loss: 0.0000, batch_loss: 11.6074, loss: 13.1748, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:11<00:01,  1.15s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3640, UAS: 0.3546, LAS: 0.1527, UEM: 0.0525, LEM: 0.0098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4938, partial_loss/deprel_loss: 6.7426, partial_loss/cycle_loss: 0.0000, batch_loss: 5.8929, loss: 12.5128, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:13<00:00,  1.27s/it]  \n",
+      "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.094  |     0.000\n",
+      "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - UEM                      |     0.000  |     0.052\n",
+      "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - LEM                      |     0.000  |     0.010\n",
+      "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - EM                       |     0.084  |     0.364\n",
+      "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     7.502  |     2.494\n",
+      "2023-04-06 22:51:01,759 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - UAS                      |     0.156  |     0.355\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6412.477  |       N/A\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     7.980  |     6.743\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - loss                     |    10.336  |    12.513\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - LAS                      |     0.040  |     0.153\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  1397.910  |       N/A\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 22:51:01,760 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 22:51:01,761 - INFO - combo.training.trainer - Epoch duration: 0:01:25.561854\n",
+      "2023-04-06 22:51:01,761 - INFO - combo.training.trainer - Estimated training time remaining: 9:28:59\n",
+      "2023-04-06 22:51:01,761 - INFO - allennlp.training.trainer - Epoch 1/399\n",
+      "2023-04-06 22:51:01,762 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 22:51:01,762 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:51:01,769 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0892, UAS: 0.3088, LAS: 0.1046, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.4360, partial_loss/deprel_loss: 7.4241, partial_loss/cycle_loss: 0.0000, batch_loss: 7.3119, loss: 7.2408, batch_reg_loss: 0.0855, reg_loss: 0.0857 ||:   4%|4         | 4/95 [00:02<00:53,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1269, UAS: 0.3102, LAS: 0.1127, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.4805, partial_loss/deprel_loss: 6.2504, partial_loss/cycle_loss: 0.0000, batch_loss: 6.1813, loss: 7.0525, batch_reg_loss: 0.0849, reg_loss: 0.0854 ||:   8%|8         | 8/95 [00:04<00:50,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3090, UAS: 0.3354, LAS: 0.1310, UEM: 0.0049, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2528, partial_loss/deprel_loss: 3.8317, partial_loss/cycle_loss: 0.0000, batch_loss: 3.6003, loss: 6.8078, batch_reg_loss: 0.0844, reg_loss: 0.0851 ||:  13%|#2        | 12/95 [00:07<00:49,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1101, UAS: 0.3157, LAS: 0.1218, UEM: 0.0043, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.7482, partial_loss/deprel_loss: 7.9708, partial_loss/cycle_loss: 0.0000, batch_loss: 8.0102, loss: 7.3046, batch_reg_loss: 0.0839, reg_loss: 0.0849 ||:  17%|#6        | 16/95 [00:09<00:47,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2304, UAS: 0.3321, LAS: 0.1318, UEM: 0.0033, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.3571, partial_loss/deprel_loss: 4.9808, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7394, loss: 7.0827, batch_reg_loss: 0.0834, reg_loss: 0.0846 ||:  21%|##1       | 20/95 [00:12<00:46,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2079, UAS: 0.3461, LAS: 0.1419, UEM: 0.0027, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4135, partial_loss/deprel_loss: 4.8411, partial_loss/cycle_loss: 0.0000, batch_loss: 4.6384, loss: 6.8631, batch_reg_loss: 0.0828, reg_loss: 0.0844 ||:  25%|##5       | 24/95 [00:14<00:44,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1619, UAS: 0.3568, LAS: 0.1503, UEM: 0.0023, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.0594, partial_loss/deprel_loss: 7.0292, partial_loss/cycle_loss: 0.0000, batch_loss: 6.9176, loss: 6.7511, batch_reg_loss: 0.0823, reg_loss: 0.0841 ||:  29%|##9       | 28/95 [00:17<00:41,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3035, UAS: 0.3679, LAS: 0.1575, UEM: 0.0038, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5356, partial_loss/deprel_loss: 4.0269, partial_loss/cycle_loss: 0.0000, batch_loss: 3.8104, loss: 6.6715, batch_reg_loss: 0.0818, reg_loss: 0.0838 ||:  34%|###3      | 32/95 [00:19<00:37,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3353, UAS: 0.3790, LAS: 0.1674, UEM: 0.0040, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5441, partial_loss/deprel_loss: 4.1055, partial_loss/cycle_loss: 0.0000, batch_loss: 3.8744, loss: 6.6041, batch_reg_loss: 0.0812, reg_loss: 0.0835 ||:  39%|###8      | 37/95 [00:22<00:33,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3046, UAS: 0.3860, LAS: 0.1749, UEM: 0.0036, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0900, partial_loss/deprel_loss: 4.5535, partial_loss/cycle_loss: 0.0000, batch_loss: 4.3415, loss: 6.5507, batch_reg_loss: 0.0807, reg_loss: 0.0832 ||:  43%|####3     | 41/95 [00:24<00:31,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2472, UAS: 0.3908, LAS: 0.1796, UEM: 0.0034, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.3257, partial_loss/deprel_loss: 5.5917, partial_loss/cycle_loss: 0.0000, batch_loss: 5.4187, loss: 6.5291, batch_reg_loss: 0.0802, reg_loss: 0.0830 ||:  47%|####7     | 45/95 [00:26<00:29,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3365, UAS: 0.4054, LAS: 0.1916, UEM: 0.0070, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.9531, partial_loss/deprel_loss: 4.3089, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1175, loss: 6.3710, batch_reg_loss: 0.0797, reg_loss: 0.0827 ||:  52%|#####1    | 49/95 [00:29<00:26,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2627, UAS: 0.4168, LAS: 0.2021, UEM: 0.0088, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.9681, partial_loss/deprel_loss: 5.8151, partial_loss/cycle_loss: 0.0000, batch_loss: 5.7249, loss: 6.2517, batch_reg_loss: 0.0792, reg_loss: 0.0825 ||:  56%|#####5    | 53/95 [00:31<00:25,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3356, UAS: 0.4249, LAS: 0.2092, UEM: 0.0083, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5951, partial_loss/deprel_loss: 4.9067, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7231, loss: 6.1661, batch_reg_loss: 0.0787, reg_loss: 0.0822 ||:  60%|######    | 57/95 [00:34<00:24,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3085, UAS: 0.4378, LAS: 0.2220, UEM: 0.0282, LEM: 0.0019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5148, partial_loss/deprel_loss: 5.2129, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1516, loss: 6.0099, batch_reg_loss: 0.0783, reg_loss: 0.0820 ||:  64%|######4   | 61/95 [00:37<00:22,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2475, UAS: 0.4450, LAS: 0.2287, UEM: 0.0392, LEM: 0.0028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.9321, partial_loss/deprel_loss: 6.5389, partial_loss/cycle_loss: 0.0000, batch_loss: 6.4955, loss: 5.9507, batch_reg_loss: 0.0779, reg_loss: 0.0818 ||:  67%|######7   | 64/95 [00:39<00:21,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3958, UAS: 0.4495, LAS: 0.2332, UEM: 0.0377, LEM: 0.0027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.1590, partial_loss/deprel_loss: 4.3287, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1724, loss: 5.9121, batch_reg_loss: 0.0776, reg_loss: 0.0816 ||:  71%|#######   | 67/95 [00:41<00:19,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2506, UAS: 0.4516, LAS: 0.2357, UEM: 0.0367, LEM: 0.0026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.5986, partial_loss/deprel_loss: 6.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5810, loss: 5.9082, batch_reg_loss: 0.0773, reg_loss: 0.0814 ||:  74%|#######3  | 70/95 [00:43<00:17,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2938, UAS: 0.4553, LAS: 0.2401, UEM: 0.0377, LEM: 0.0027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.9417, partial_loss/deprel_loss: 6.1287, partial_loss/cycle_loss: 0.0000, batch_loss: 6.1683, loss: 5.8802, batch_reg_loss: 0.0770, reg_loss: 0.0813 ||:  77%|#######6  | 73/95 [00:46<00:15,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3746, UAS: 0.4615, LAS: 0.2468, UEM: 0.0361, LEM: 0.0025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.0424, partial_loss/deprel_loss: 4.8777, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7872, loss: 5.8175, batch_reg_loss: 0.0765, reg_loss: 0.0810 ||:  81%|########1 | 77/95 [00:48<00:12,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6636, UAS: 0.4715, LAS: 0.2577, UEM: 0.0619, LEM: 0.0139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5887, partial_loss/deprel_loss: 1.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2757, loss: 5.7031, batch_reg_loss: 0.0762, reg_loss: 0.0808 ||:  84%|########4 | 80/95 [00:51<00:11,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4942, UAS: 0.4770, LAS: 0.2646, UEM: 0.0600, LEM: 0.0134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5109, partial_loss/deprel_loss: 3.5031, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3806, loss: 5.6570, batch_reg_loss: 0.0759, reg_loss: 0.0806 ||:  88%|########8 | 84/95 [00:54<00:07,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3159, UAS: 0.4840, LAS: 0.2728, UEM: 0.0585, LEM: 0.0128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.1182, partial_loss/deprel_loss: 5.8656, partial_loss/cycle_loss: 0.0000, batch_loss: 5.9916, loss: 5.5923, batch_reg_loss: 0.0755, reg_loss: 0.0804 ||:  93%|#########2| 88/95 [00:56<00:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4646, UAS: 0.4886, LAS: 0.2786, UEM: 0.0570, LEM: 0.0125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0568, partial_loss/deprel_loss: 3.9986, partial_loss/cycle_loss: 0.0000, batch_loss: 3.8854, loss: 5.5646, batch_reg_loss: 0.0752, reg_loss: 0.0802 ||:  97%|#########6| 92/95 [00:58<00:01,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6402, UAS: 0.4963, LAS: 0.2871, UEM: 0.0600, LEM: 0.0126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1759, partial_loss/deprel_loss: 2.2577, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1162, loss: 5.4829, batch_reg_loss: 0.0749, reg_loss: 0.0800 ||: 100%|##########| 95/95 [01:00<00:00,  1.56it/s]\n",
+      "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.080  |       N/A\n",
+      "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - UEM                      |     0.060  |       N/A\n",
+      "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - LEM                      |     0.013  |       N/A\n",
+      "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - EM                       |     0.640  |       N/A\n",
+      "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.176  |       N/A\n",
+      "2023-04-06 22:52:02,565 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - UAS                      |     0.496  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     2.258  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - loss                     |     5.483  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - LAS                      |     0.287  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.722  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:52:02,566 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:52:02,567 - INFO - combo.training.trainer - Epoch duration: 0:01:00.805524\n",
+      "2023-04-06 22:52:02,567 - INFO - combo.training.trainer - Estimated training time remaining: 8:05:27\n",
+      "2023-04-06 22:52:02,567 - INFO - allennlp.training.trainer - Epoch 2/399\n",
+      "2023-04-06 22:52:02,567 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 22:52:02,568 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:52:02,574 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5070, UAS: 0.6220, LAS: 0.4480, UEM: 0.0040, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7143, partial_loss/deprel_loss: 3.5357, partial_loss/cycle_loss: 0.0000, batch_loss: 3.4460, loss: 4.2797, batch_reg_loss: 0.0746, reg_loss: 0.0747 ||:   4%|4         | 4/95 [00:02<00:57,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5354, UAS: 0.6512, LAS: 0.4740, UEM: 0.0028, LEM: 0.0009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6557, partial_loss/deprel_loss: 3.4796, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3891, loss: 3.9798, batch_reg_loss: 0.0743, reg_loss: 0.0745 ||:   8%|8         | 8/95 [00:05<00:54,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5451, UAS: 0.6686, LAS: 0.4905, UEM: 0.0285, LEM: 0.0017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3370, partial_loss/deprel_loss: 3.2024, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1032, loss: 3.8055, batch_reg_loss: 0.0739, reg_loss: 0.0744 ||:  13%|#2        | 12/95 [00:07<00:53,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3732, UAS: 0.6592, LAS: 0.4869, UEM: 0.0549, LEM: 0.0066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.0546, partial_loss/deprel_loss: 5.3551, partial_loss/cycle_loss: 0.0000, batch_loss: 5.5687, loss: 3.9035, batch_reg_loss: 0.0737, reg_loss: 0.0743 ||:  16%|#5        | 15/95 [00:09<00:53,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5262, UAS: 0.6727, LAS: 0.4998, UEM: 0.0628, LEM: 0.0070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6727, partial_loss/deprel_loss: 3.4231, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3465, loss: 3.7405, batch_reg_loss: 0.0735, reg_loss: 0.0741 ||:  19%|#8        | 18/95 [00:12<00:53,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6196, UAS: 0.6788, LAS: 0.5066, UEM: 0.0849, LEM: 0.0087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5574, partial_loss/deprel_loss: 2.5821, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4504, loss: 3.6848, batch_reg_loss: 0.0733, reg_loss: 0.0740 ||:  22%|##2       | 21/95 [00:14<00:52,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4468, UAS: 0.6777, LAS: 0.5063, UEM: 0.0764, LEM: 0.0079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.3180, partial_loss/deprel_loss: 4.4548, partial_loss/cycle_loss: 0.0000, batch_loss: 4.5005, loss: 3.6993, batch_reg_loss: 0.0731, reg_loss: 0.0739 ||:  25%|##5       | 24/95 [00:16<00:50,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6454, UAS: 0.6869, LAS: 0.5163, UEM: 0.0824, LEM: 0.0090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3747, partial_loss/deprel_loss: 2.2014, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1089, loss: 3.5795, batch_reg_loss: 0.0729, reg_loss: 0.0738 ||:  28%|##8       | 27/95 [00:18<00:48,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6744, UAS: 0.6970, LAS: 0.5267, UEM: 0.2029, LEM: 0.0663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8321, partial_loss/deprel_loss: 1.8400, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7111, loss: 3.4778, batch_reg_loss: 0.0727, reg_loss: 0.0737 ||:  32%|###1      | 30/95 [00:21<00:50,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4503, UAS: 0.6922, LAS: 0.5225, UEM: 0.1897, LEM: 0.0620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.6911, partial_loss/deprel_loss: 4.8424, partial_loss/cycle_loss: 0.0000, batch_loss: 4.8846, loss: 3.5555, batch_reg_loss: 0.0724, reg_loss: 0.0736 ||:  36%|###5      | 34/95 [00:24<00:44,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6986, UAS: 0.7002, LAS: 0.5305, UEM: 0.2109, LEM: 0.0621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6816, partial_loss/deprel_loss: 1.6548, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5324, loss: 3.4693, batch_reg_loss: 0.0723, reg_loss: 0.0735 ||:  39%|###8      | 37/95 [00:26<00:44,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5281, UAS: 0.7007, LAS: 0.5313, UEM: 0.1987, LEM: 0.0581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2648, partial_loss/deprel_loss: 3.6513, partial_loss/cycle_loss: 0.0000, batch_loss: 3.6460, loss: 3.4727, batch_reg_loss: 0.0720, reg_loss: 0.0733 ||:  43%|####3     | 41/95 [00:29<00:39,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4741, UAS: 0.6962, LAS: 0.5273, UEM: 0.1924, LEM: 0.0563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4164, partial_loss/deprel_loss: 4.4130, partial_loss/cycle_loss: 0.0000, batch_loss: 4.4855, loss: 3.5359, batch_reg_loss: 0.0718, reg_loss: 0.0732 ||:  46%|####6     | 44/95 [00:31<00:36,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5552, UAS: 0.6990, LAS: 0.5305, UEM: 0.1911, LEM: 0.0544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7836, partial_loss/deprel_loss: 3.3469, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3059, loss: 3.5092, batch_reg_loss: 0.0717, reg_loss: 0.0731 ||:  49%|####9     | 47/95 [00:33<00:35,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7089, UAS: 0.7034, LAS: 0.5355, UEM: 0.1959, LEM: 0.0544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8202, partial_loss/deprel_loss: 1.7523, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6374, loss: 3.4603, batch_reg_loss: 0.0715, reg_loss: 0.0730 ||:  53%|#####2    | 50/95 [00:35<00:34,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5674, UAS: 0.7029, LAS: 0.5355, UEM: 0.1889, LEM: 0.0524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8019, partial_loss/deprel_loss: 3.3643, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3231, loss: 3.4721, batch_reg_loss: 0.0713, reg_loss: 0.0729 ||:  56%|#####5    | 53/95 [00:37<00:30,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4533, UAS: 0.7061, LAS: 0.5395, UEM: 0.1821, LEM: 0.0493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.9593, partial_loss/deprel_loss: 4.6140, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7542, loss: 3.4339, batch_reg_loss: 0.0711, reg_loss: 0.0728 ||:  60%|######    | 57/95 [00:40<00:25,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6635, UAS: 0.7108, LAS: 0.5443, UEM: 0.1847, LEM: 0.0478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3704, partial_loss/deprel_loss: 2.2964, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1821, loss: 3.3868, batch_reg_loss: 0.0709, reg_loss: 0.0727 ||:  64%|######4   | 61/95 [00:42<00:22,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5675, UAS: 0.7133, LAS: 0.5472, UEM: 0.1795, LEM: 0.0456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8984, partial_loss/deprel_loss: 3.5634, partial_loss/cycle_loss: 0.0000, batch_loss: 3.5010, loss: 3.3671, batch_reg_loss: 0.0707, reg_loss: 0.0726 ||:  68%|######8   | 65/95 [00:45<00:20,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6256, UAS: 0.7172, LAS: 0.5516, UEM: 0.1924, LEM: 0.0494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9098, partial_loss/deprel_loss: 2.6757, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5930, loss: 3.3262, batch_reg_loss: 0.0705, reg_loss: 0.0725 ||:  72%|#######1  | 68/95 [00:47<00:19,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6834, UAS: 0.7184, LAS: 0.5535, UEM: 0.1973, LEM: 0.0488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1975, partial_loss/deprel_loss: 2.0961, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9867, loss: 3.3143, batch_reg_loss: 0.0704, reg_loss: 0.0724 ||:  75%|#######4  | 71/95 [00:49<00:17,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5457, UAS: 0.7191, LAS: 0.5544, UEM: 0.1902, LEM: 0.0470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2685, partial_loss/deprel_loss: 3.7732, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7424, loss: 3.3121, batch_reg_loss: 0.0702, reg_loss: 0.0723 ||:  79%|#######8  | 75/95 [00:52<00:13,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4441, UAS: 0.7213, LAS: 0.5570, UEM: 0.1863, LEM: 0.0451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.3762, partial_loss/deprel_loss: 4.7015, partial_loss/cycle_loss: 0.0000, batch_loss: 4.9064, loss: 3.2949, batch_reg_loss: 0.0700, reg_loss: 0.0722 ||:  83%|########3 | 79/95 [00:54<00:10,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7161, UAS: 0.7224, LAS: 0.5588, UEM: 0.1833, LEM: 0.0441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0918, partial_loss/deprel_loss: 1.9270, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8298, loss: 3.2891, batch_reg_loss: 0.0698, reg_loss: 0.0721 ||:  87%|########7 | 83/95 [00:57<00:07,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5738, UAS: 0.7242, LAS: 0.5609, UEM: 0.1823, LEM: 0.0430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8083, partial_loss/deprel_loss: 3.3905, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3436, loss: 3.2741, batch_reg_loss: 0.0696, reg_loss: 0.0720 ||:  92%|#########1| 87/95 [01:00<00:05,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6708, UAS: 0.7295, LAS: 0.5668, UEM: 0.2018, LEM: 0.0497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4738, partial_loss/deprel_loss: 2.0978, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0424, loss: 3.2064, batch_reg_loss: 0.0694, reg_loss: 0.0718 ||:  96%|#########5| 91/95 [01:03<00:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7269, UAS: 0.7333, LAS: 0.5708, UEM: 0.2004, LEM: 0.0483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9830, partial_loss/deprel_loss: 1.8156, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7183, loss: 3.1682, batch_reg_loss: 0.0692, reg_loss: 0.0717 ||: 100%|##########| 95/95 [01:05<00:00,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7269, UAS: 0.7333, LAS: 0.5708, UEM: 0.2004, LEM: 0.0483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9830, partial_loss/deprel_loss: 1.8156, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7183, loss: 3.1682, batch_reg_loss: 0.0692, reg_loss: 0.0717 ||: 100%|##########| 95/95 [01:05<00:00,  1.45it/s]\n",
+      "2023-04-06 22:53:08,051 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.072  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - UEM                      |     0.200  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - LEM                      |     0.048  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - EM                       |     0.727  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.983  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - UAS                      |     0.733  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.816  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - loss                     |     3.168  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - LAS                      |     0.571  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.722  |       N/A\n",
+      "2023-04-06 22:53:08,052 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:53:08,053 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:53:08,053 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:53:08,053 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:53:08,053 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:53:08,053 - INFO - combo.training.trainer - Epoch duration: 0:01:05.486109\n",
+      "2023-04-06 22:53:08,053 - INFO - combo.training.trainer - Estimated training time remaining: 7:47:15\n",
+      "2023-04-06 22:53:08,053 - INFO - allennlp.training.trainer - Epoch 3/399\n",
+      "2023-04-06 22:53:08,054 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 22:53:08,054 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:53:08,060 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6676, UAS: 0.8632, LAS: 0.7232, UEM: 0.4714, LEM: 0.1227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6770, partial_loss/deprel_loss: 2.2723, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2223, loss: 1.6806, batch_reg_loss: 0.0691, reg_loss: 0.0691 ||:   3%|3         | 3/95 [00:02<01:07,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6184, UAS: 0.8099, LAS: 0.6626, UEM: 0.3402, LEM: 0.0788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0338, partial_loss/deprel_loss: 2.8807, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7803, loss: 2.3373, batch_reg_loss: 0.0689, reg_loss: 0.0690 ||:   7%|7         | 7/95 [00:04<01:01,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7145, UAS: 0.7989, LAS: 0.6512, UEM: 0.2798, LEM: 0.0575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0975, partial_loss/deprel_loss: 1.9117, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8176, loss: 2.4843, batch_reg_loss: 0.0687, reg_loss: 0.0689 ||:  12%|#1        | 11/95 [00:07<00:56,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7915, UAS: 0.7842, LAS: 0.6396, UEM: 0.3657, LEM: 0.1059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3674, partial_loss/deprel_loss: 1.0387, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9730, loss: 2.6558, batch_reg_loss: 0.0686, reg_loss: 0.0689 ||:  15%|#4        | 14/95 [00:09<00:55,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6064, UAS: 0.7826, LAS: 0.6378, UEM: 0.3203, LEM: 0.0919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4228, partial_loss/deprel_loss: 2.9571, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9187, loss: 2.6608, batch_reg_loss: 0.0684, reg_loss: 0.0688 ||:  19%|#8        | 18/95 [00:11<00:51,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7368, UAS: 0.7888, LAS: 0.6459, UEM: 0.3072, LEM: 0.0861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8931, partial_loss/deprel_loss: 1.4595, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4146, loss: 2.5648, batch_reg_loss: 0.0683, reg_loss: 0.0687 ||:  22%|##2       | 21/95 [00:13<00:50,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6162, UAS: 0.7853, LAS: 0.6437, UEM: 0.2928, LEM: 0.0783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5406, partial_loss/deprel_loss: 2.8730, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8748, loss: 2.5919, batch_reg_loss: 0.0682, reg_loss: 0.0687 ||:  26%|##6       | 25/95 [00:16<00:45,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7049, UAS: 0.7937, LAS: 0.6520, UEM: 0.2802, LEM: 0.0692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2069, partial_loss/deprel_loss: 1.8636, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8003, loss: 2.4999, batch_reg_loss: 0.0681, reg_loss: 0.0686 ||:  31%|###       | 29/95 [00:18<00:43,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7526, UAS: 0.7956, LAS: 0.6543, UEM: 0.2755, LEM: 0.0677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9012, partial_loss/deprel_loss: 1.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4053, loss: 2.4758, batch_reg_loss: 0.0679, reg_loss: 0.0685 ||:  34%|###3      | 32/95 [00:21<00:43,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5970, UAS: 0.7955, LAS: 0.6540, UEM: 0.2638, LEM: 0.0624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.9471, partial_loss/deprel_loss: 3.2983, partial_loss/cycle_loss: 0.0000, batch_loss: 3.2959, loss: 2.4902, batch_reg_loss: 0.0678, reg_loss: 0.0685 ||:  38%|###7      | 36/95 [00:23<00:39,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6423, UAS: 0.7992, LAS: 0.6577, UEM: 0.2635, LEM: 0.0610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0873, partial_loss/deprel_loss: 2.6302, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5893, loss: 2.4497, batch_reg_loss: 0.0677, reg_loss: 0.0684 ||:  41%|####1     | 39/95 [00:25<00:38,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7397, UAS: 0.8000, LAS: 0.6588, UEM: 0.2579, LEM: 0.0586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1241, partial_loss/deprel_loss: 1.7406, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6849, loss: 2.4383, batch_reg_loss: 0.0676, reg_loss: 0.0683 ||:  44%|####4     | 42/95 [00:27<00:36,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6546, UAS: 0.8001, LAS: 0.6591, UEM: 0.2563, LEM: 0.0575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1341, partial_loss/deprel_loss: 2.6585, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6210, loss: 2.4478, batch_reg_loss: 0.0675, reg_loss: 0.0683 ||:  47%|####7     | 45/95 [00:30<00:35,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7658, UAS: 0.8053, LAS: 0.6651, UEM: 0.2685, LEM: 0.0602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7582, partial_loss/deprel_loss: 1.4311, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3638, loss: 2.3887, batch_reg_loss: 0.0673, reg_loss: 0.0682 ||:  52%|#####1    | 49/95 [00:32<00:31,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6690, UAS: 0.8032, LAS: 0.6633, UEM: 0.2763, LEM: 0.0646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8230, partial_loss/deprel_loss: 2.4741, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4111, loss: 2.4123, batch_reg_loss: 0.0672, reg_loss: 0.0681 ||:  56%|#####5    | 53/95 [00:35<00:29,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6075, UAS: 0.8054, LAS: 0.6659, UEM: 0.3141, LEM: 0.0993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6840, partial_loss/deprel_loss: 3.1979, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1622, loss: 2.3942, batch_reg_loss: 0.0671, reg_loss: 0.0681 ||:  59%|#####8    | 56/95 [00:37<00:28,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6152, UAS: 0.8064, LAS: 0.6669, UEM: 0.3160, LEM: 0.0996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6132, partial_loss/deprel_loss: 2.9013, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9107, loss: 2.3838, batch_reg_loss: 0.0670, reg_loss: 0.0680 ||:  62%|######2   | 59/95 [00:39<00:25,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7006, UAS: 0.8043, LAS: 0.6649, UEM: 0.3079, LEM: 0.0963, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3980, partial_loss/deprel_loss: 2.0046, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9501, loss: 2.4046, batch_reg_loss: 0.0669, reg_loss: 0.0680 ||:  65%|######5   | 62/95 [00:42<00:23,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7086, UAS: 0.8070, LAS: 0.6679, UEM: 0.3095, LEM: 0.0952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4375, partial_loss/deprel_loss: 2.0754, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0146, loss: 2.3713, batch_reg_loss: 0.0668, reg_loss: 0.0679 ||:  68%|######8   | 65/95 [00:44<00:21,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6813, UAS: 0.8084, LAS: 0.6699, UEM: 0.3166, LEM: 0.0989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8208, partial_loss/deprel_loss: 2.2253, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2111, loss: 2.3507, batch_reg_loss: 0.0667, reg_loss: 0.0679 ||:  72%|#######1  | 68/95 [00:46<00:19,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5871, UAS: 0.8070, LAS: 0.6691, UEM: 0.3075, LEM: 0.0954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.6979, partial_loss/deprel_loss: 3.2119, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3757, loss: 2.3629, batch_reg_loss: 0.0666, reg_loss: 0.0678 ||:  76%|#######5  | 72/95 [00:49<00:16,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7640, UAS: 0.8099, LAS: 0.6725, UEM: 0.3097, LEM: 0.0946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8809, partial_loss/deprel_loss: 1.5519, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4842, loss: 2.3301, batch_reg_loss: 0.0665, reg_loss: 0.0677 ||:  79%|#######8  | 75/95 [00:51<00:14,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6154, UAS: 0.8082, LAS: 0.6707, UEM: 0.3018, LEM: 0.0919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.9648, partial_loss/deprel_loss: 3.0318, partial_loss/cycle_loss: 0.0000, batch_loss: 3.0848, loss: 2.3541, batch_reg_loss: 0.0664, reg_loss: 0.0677 ||:  83%|########3 | 79/95 [00:53<00:11,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7683, UAS: 0.8076, LAS: 0.6706, UEM: 0.3035, LEM: 0.0922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6683, partial_loss/deprel_loss: 1.2700, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2159, loss: 2.3611, batch_reg_loss: 0.0662, reg_loss: 0.0676 ||:  87%|########7 | 83/95 [00:56<00:08,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6539, UAS: 0.8071, LAS: 0.6703, UEM: 0.2953, LEM: 0.0894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9894, partial_loss/deprel_loss: 2.5136, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4749, loss: 2.3662, batch_reg_loss: 0.0661, reg_loss: 0.0675 ||:  92%|#########1| 87/95 [00:58<00:05,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7706, UAS: 0.8079, LAS: 0.6718, UEM: 0.2955, LEM: 0.0888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0825, partial_loss/deprel_loss: 1.6397, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5943, loss: 2.3576, batch_reg_loss: 0.0660, reg_loss: 0.0675 ||:  96%|#########5| 91/95 [01:02<00:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6631, UAS: 0.8087, LAS: 0.6729, UEM: 0.2926, LEM: 0.0870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5400, partial_loss/deprel_loss: 2.6590, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7012, loss: 2.3477, batch_reg_loss: 0.0660, reg_loss: 0.0674 ||:  99%|#########8| 94/95 [01:04<00:00,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7584, UAS: 0.8094, LAS: 0.6738, UEM: 0.2935, LEM: 0.0868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9615, partial_loss/deprel_loss: 1.4679, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4326, loss: 2.3380, batch_reg_loss: 0.0659, reg_loss: 0.0674 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n",
+      "2023-04-06 22:54:13,234 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.067  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - UEM                      |     0.293  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - LEM                      |     0.087  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - EM                       |     0.758  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.961  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - UAS                      |     0.809  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.468  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - loss                     |     2.338  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - LAS                      |     0.674  |       N/A\n",
+      "2023-04-06 22:54:13,235 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.722  |       N/A\n",
+      "2023-04-06 22:54:13,236 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:54:13,236 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:54:13,236 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:54:13,236 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:54:13,236 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:54:13,236 - INFO - combo.training.trainer - Epoch duration: 0:01:05.182956\n",
+      "2023-04-06 22:54:13,236 - INFO - combo.training.trainer - Estimated training time remaining: 7:37:06\n",
+      "2023-04-06 22:54:13,237 - INFO - allennlp.training.trainer - Epoch 4/399\n",
+      "2023-04-06 22:54:13,237 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 22:54:13,237 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-06 22:54:13,244 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7843, UAS: 0.8423, LAS: 0.7132, UEM: 0.2309, LEM: 0.0471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7504, partial_loss/deprel_loss: 1.3710, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3127, loss: 2.0264, batch_reg_loss: 0.0659, reg_loss: 0.0659 ||:   3%|3         | 3/95 [00:02<01:08,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6926, UAS: 0.8477, LAS: 0.7204, UEM: 0.3100, LEM: 0.0892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8003, partial_loss/deprel_loss: 2.2492, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2252, loss: 1.9304, batch_reg_loss: 0.0658, reg_loss: 0.0659 ||:   6%|6         | 6/95 [00:04<01:05,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7859, UAS: 0.8541, LAS: 0.7301, UEM: 0.3025, LEM: 0.0763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7349, partial_loss/deprel_loss: 1.3564, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2978, loss: 1.8328, batch_reg_loss: 0.0657, reg_loss: 0.0658 ||:   9%|9         | 9/95 [00:06<01:02,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8201, UAS: 0.8576, LAS: 0.7345, UEM: 0.3501, LEM: 0.1083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3614, partial_loss/deprel_loss: 0.9258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8785, loss: 1.7845, batch_reg_loss: 0.0656, reg_loss: 0.0658 ||:  14%|#3        | 13/95 [00:09<00:57,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7617, UAS: 0.8507, LAS: 0.7264, UEM: 0.3186, LEM: 0.0950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9531, partial_loss/deprel_loss: 1.5410, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4890, loss: 1.8748, batch_reg_loss: 0.0656, reg_loss: 0.0657 ||:  18%|#7        | 17/95 [00:11<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6461, UAS: 0.8475, LAS: 0.7246, UEM: 0.3116, LEM: 0.0926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6654, partial_loss/deprel_loss: 2.6974, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7565, loss: 1.8976, batch_reg_loss: 0.0655, reg_loss: 0.0657 ||:  21%|##1       | 20/95 [00:14<00:53,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7139, UAS: 0.8476, LAS: 0.7244, UEM: 0.2888, LEM: 0.0847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6077, partial_loss/deprel_loss: 2.1567, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1123, loss: 1.9062, batch_reg_loss: 0.0654, reg_loss: 0.0657 ||:  24%|##4       | 23/95 [00:16<00:50,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7580, UAS: 0.8514, LAS: 0.7285, UEM: 0.2895, LEM: 0.0811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9473, partial_loss/deprel_loss: 1.4645, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4264, loss: 1.8600, batch_reg_loss: 0.0654, reg_loss: 0.0656 ||:  27%|##7       | 26/95 [00:18<00:50,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6262, UAS: 0.8450, LAS: 0.7213, UEM: 0.2705, LEM: 0.0746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.1282, partial_loss/deprel_loss: 3.0901, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1630, loss: 1.9443, batch_reg_loss: 0.0653, reg_loss: 0.0656 ||:  32%|###1      | 30/95 [00:21<00:46,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5623, UAS: 0.8420, LAS: 0.7187, UEM: 0.2983, LEM: 0.0907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8987, partial_loss/deprel_loss: 3.4147, partial_loss/cycle_loss: 0.0000, batch_loss: 3.5767, loss: 1.9711, batch_reg_loss: 0.0652, reg_loss: 0.0656 ||:  35%|###4      | 33/95 [00:23<00:45,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7552, UAS: 0.8439, LAS: 0.7209, UEM: 0.2955, LEM: 0.0870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2850, partial_loss/deprel_loss: 1.7603, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7304, loss: 1.9546, batch_reg_loss: 0.0651, reg_loss: 0.0655 ||:  39%|###8      | 37/95 [00:26<00:40,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7858, UAS: 0.8456, LAS: 0.7232, UEM: 0.2993, LEM: 0.0856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7638, partial_loss/deprel_loss: 1.2336, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2048, loss: 1.9263, batch_reg_loss: 0.0651, reg_loss: 0.0655 ||:  42%|####2     | 40/95 [00:28<00:39,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6026, UAS: 0.8447, LAS: 0.7235, UEM: 0.3057, LEM: 0.0879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5938, partial_loss/deprel_loss: 2.9975, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1818, loss: 1.9216, batch_reg_loss: 0.0650, reg_loss: 0.0655 ||:  45%|####5     | 43/95 [00:30<00:37,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5178, UAS: 0.8369, LAS: 0.7161, UEM: 0.2946, LEM: 0.0839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.1605, partial_loss/deprel_loss: 3.8058, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1417, loss: 2.0016, batch_reg_loss: 0.0649, reg_loss: 0.0654 ||:  49%|####9     | 47/95 [00:33<00:33,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7229, UAS: 0.8353, LAS: 0.7140, UEM: 0.2853, LEM: 0.0808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3310, partial_loss/deprel_loss: 1.8267, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7924, loss: 2.0231, batch_reg_loss: 0.0649, reg_loss: 0.0654 ||:  53%|#####2    | 50/95 [00:35<00:31,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7935, UAS: 0.8356, LAS: 0.7142, UEM: 0.2897, LEM: 0.0806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8164, partial_loss/deprel_loss: 1.2976, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2662, loss: 2.0258, batch_reg_loss: 0.0648, reg_loss: 0.0654 ||:  56%|#####5    | 53/95 [00:37<00:29,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7302, UAS: 0.8354, LAS: 0.7141, UEM: 0.2827, LEM: 0.0778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4899, partial_loss/deprel_loss: 1.9265, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9039, loss: 2.0274, batch_reg_loss: 0.0648, reg_loss: 0.0653 ||:  59%|#####8    | 56/95 [00:39<00:27,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7533, UAS: 0.8385, LAS: 0.7180, UEM: 0.3088, LEM: 0.0960, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3812, partial_loss/deprel_loss: 1.7436, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7359, loss: 1.9906, batch_reg_loss: 0.0647, reg_loss: 0.0653 ||:  62%|######2   | 59/95 [00:41<00:26,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8078, UAS: 0.8402, LAS: 0.7202, UEM: 0.3200, LEM: 0.1007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6234, partial_loss/deprel_loss: 1.1282, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0919, loss: 1.9686, batch_reg_loss: 0.0647, reg_loss: 0.0653 ||:  65%|######5   | 62/95 [00:44<00:24,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7705, UAS: 0.8412, LAS: 0.7218, UEM: 0.3186, LEM: 0.0985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0299, partial_loss/deprel_loss: 1.5173, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4845, loss: 1.9581, batch_reg_loss: 0.0646, reg_loss: 0.0652 ||:  69%|######9   | 66/95 [00:46<00:20,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6569, UAS: 0.8412, LAS: 0.7219, UEM: 0.3170, LEM: 0.0974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6073, partial_loss/deprel_loss: 2.6569, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7116, loss: 1.9593, batch_reg_loss: 0.0646, reg_loss: 0.0652 ||:  73%|#######2  | 69/95 [00:48<00:18,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7088, UAS: 0.8419, LAS: 0.7232, UEM: 0.3224, LEM: 0.1000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8421, partial_loss/deprel_loss: 2.0728, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0911, loss: 1.9493, batch_reg_loss: 0.0645, reg_loss: 0.0652 ||:  77%|#######6  | 73/95 [00:51<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7706, UAS: 0.8427, LAS: 0.7244, UEM: 0.3220, LEM: 0.0990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1610, partial_loss/deprel_loss: 1.5024, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4986, loss: 1.9372, batch_reg_loss: 0.0645, reg_loss: 0.0651 ||:  80%|########  | 76/95 [00:53<00:12,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7085, UAS: 0.8434, LAS: 0.7254, UEM: 0.3490, LEM: 0.1270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7673, partial_loss/deprel_loss: 2.1132, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1084, loss: 1.9316, batch_reg_loss: 0.0644, reg_loss: 0.0651 ||:  83%|########3 | 79/95 [00:55<00:11,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8151, UAS: 0.8439, LAS: 0.7262, UEM: 0.3482, LEM: 0.1258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4797, partial_loss/deprel_loss: 1.0876, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0303, loss: 1.9255, batch_reg_loss: 0.0643, reg_loss: 0.0651 ||:  87%|########7 | 83/95 [00:58<00:08,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7979, UAS: 0.8448, LAS: 0.7271, UEM: 0.3537, LEM: 0.1279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7547, partial_loss/deprel_loss: 1.3058, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2599, loss: 1.9150, batch_reg_loss: 0.0643, reg_loss: 0.0650 ||:  91%|######### | 86/95 [01:00<00:06,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7795, UAS: 0.8455, LAS: 0.7279, UEM: 0.3476, LEM: 0.1250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0215, partial_loss/deprel_loss: 1.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4521, loss: 1.9097, batch_reg_loss: 0.0643, reg_loss: 0.0650 ||:  94%|#########3| 89/95 [01:02<00:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7703, UAS: 0.8448, LAS: 0.7275, UEM: 0.3426, LEM: 0.1220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0980, partial_loss/deprel_loss: 1.5023, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4857, loss: 1.9164, batch_reg_loss: 0.0642, reg_loss: 0.0650 ||:  98%|#########7| 93/95 [01:05<00:01,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8175, UAS: 0.8456, LAS: 0.7284, UEM: 0.3446, LEM: 0.1221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5265, partial_loss/deprel_loss: 1.0597, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0172, loss: 1.9074, batch_reg_loss: 0.0642, reg_loss: 0.0650 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-06 22:55:19,632 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.065  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - UEM                      |     0.345  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - LEM                      |     0.122  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - EM                       |     0.817  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.526  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - UAS                      |     0.846  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.060  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - loss                     |     1.907  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:55:19,633 - INFO - combo.training.tensorboard_writer - LAS                      |     0.728  |       N/A\n",
+      "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.722  |       N/A\n",
+      "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:55:19,634 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:55:19,634 - INFO - combo.training.trainer - Epoch duration: 0:01:06.397867\n",
+      "2023-04-06 22:55:19,635 - INFO - combo.training.trainer - Estimated training time remaining: 7:32:11\n",
+      "2023-04-06 22:55:19,635 - INFO - allennlp.training.trainer - Epoch 5/399\n",
+      "2023-04-06 22:55:19,635 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 22:55:19,635 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:55:19,642 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7362, UAS: 0.8409, LAS: 0.7299, UEM: 0.1639, LEM: 0.0250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5391, partial_loss/deprel_loss: 1.9122, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9017, loss: 1.9255, batch_reg_loss: 0.0641, reg_loss: 0.0642 ||:   3%|3         | 3/95 [00:02<01:11,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7690, UAS: 0.8589, LAS: 0.7505, UEM: 0.2830, LEM: 0.0794, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1920, partial_loss/deprel_loss: 1.5500, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5425, loss: 1.7310, batch_reg_loss: 0.0641, reg_loss: 0.0641 ||:   6%|6         | 6/95 [00:04<01:07,  1.32it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8373, UAS: 0.8832, LAS: 0.7762, UEM: 0.4822, LEM: 0.1763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3430, partial_loss/deprel_loss: 0.8381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8032, loss: 1.4723, batch_reg_loss: 0.0641, reg_loss: 0.0641 ||:   9%|9         | 9/95 [00:06<01:05,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7172, UAS: 0.8691, LAS: 0.7610, UEM: 0.4246, LEM: 0.1533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8046, partial_loss/deprel_loss: 1.9388, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9760, loss: 1.6106, batch_reg_loss: 0.0640, reg_loss: 0.0641 ||:  14%|#3        | 13/95 [00:09<00:59,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6100, UAS: 0.8599, LAS: 0.7513, UEM: 0.3860, LEM: 0.1360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4556, partial_loss/deprel_loss: 2.9102, partial_loss/cycle_loss: 0.0000, batch_loss: 3.0833, loss: 1.7038, batch_reg_loss: 0.0640, reg_loss: 0.0641 ||:  17%|#6        | 16/95 [00:11<00:56,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6830, UAS: 0.8635, LAS: 0.7553, UEM: 0.4120, LEM: 0.1493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1722, partial_loss/deprel_loss: 2.3345, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3660, loss: 1.6729, batch_reg_loss: 0.0639, reg_loss: 0.0641 ||:  20%|##        | 19/95 [00:13<00:56,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8055, UAS: 0.8630, LAS: 0.7545, UEM: 0.3829, LEM: 0.1339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8116, partial_loss/deprel_loss: 1.2710, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2430, loss: 1.6813, batch_reg_loss: 0.0639, reg_loss: 0.0640 ||:  24%|##4       | 23/95 [00:16<00:50,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7791, UAS: 0.8597, LAS: 0.7516, UEM: 0.3563, LEM: 0.1215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9777, partial_loss/deprel_loss: 1.4278, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4016, loss: 1.7203, batch_reg_loss: 0.0639, reg_loss: 0.0640 ||:  28%|##8       | 27/95 [00:18<00:45,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8253, UAS: 0.8656, LAS: 0.7593, UEM: 0.4287, LEM: 0.1921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6121, partial_loss/deprel_loss: 0.9983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9849, loss: 1.6482, batch_reg_loss: 0.0638, reg_loss: 0.0640 ||:  32%|###1      | 30/95 [00:21<00:46,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7071, UAS: 0.8680, LAS: 0.7625, UEM: 0.4650, LEM: 0.2164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0660, partial_loss/deprel_loss: 2.1342, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1843, loss: 1.6122, batch_reg_loss: 0.0638, reg_loss: 0.0640 ||:  35%|###4      | 33/95 [00:23<00:46,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7614, UAS: 0.8645, LAS: 0.7587, UEM: 0.4402, LEM: 0.2026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2990, partial_loss/deprel_loss: 1.6074, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6095, loss: 1.6531, batch_reg_loss: 0.0637, reg_loss: 0.0640 ||:  39%|###8      | 37/95 [00:26<00:41,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6848, UAS: 0.8611, LAS: 0.7551, UEM: 0.4345, LEM: 0.1977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6570, partial_loss/deprel_loss: 2.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5164, loss: 1.6897, batch_reg_loss: 0.0637, reg_loss: 0.0639 ||:  43%|####3     | 41/95 [00:28<00:36,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7787, UAS: 0.8584, LAS: 0.7522, UEM: 0.4205, LEM: 0.1885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0538, partial_loss/deprel_loss: 1.4761, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4553, loss: 1.7256, batch_reg_loss: 0.0637, reg_loss: 0.0639 ||:  47%|####7     | 45/95 [00:31<00:33,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8132, UAS: 0.8591, LAS: 0.7532, UEM: 0.4148, LEM: 0.1806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8750, partial_loss/deprel_loss: 1.2898, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2705, loss: 1.7183, batch_reg_loss: 0.0637, reg_loss: 0.0639 ||:  52%|#####1    | 49/95 [00:33<00:30,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7496, UAS: 0.8582, LAS: 0.7519, UEM: 0.4014, LEM: 0.1722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3200, partial_loss/deprel_loss: 1.7153, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6999, loss: 1.7334, batch_reg_loss: 0.0636, reg_loss: 0.0639 ||:  56%|#####5    | 53/95 [00:36<00:27,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6925, UAS: 0.8586, LAS: 0.7525, UEM: 0.4015, LEM: 0.1710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3983, partial_loss/deprel_loss: 2.4521, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5049, loss: 1.7337, batch_reg_loss: 0.0636, reg_loss: 0.0639 ||:  60%|######    | 57/95 [00:39<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7734, UAS: 0.8588, LAS: 0.7527, UEM: 0.3885, LEM: 0.1633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1734, partial_loss/deprel_loss: 1.5985, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5771, loss: 1.7317, batch_reg_loss: 0.0636, reg_loss: 0.0638 ||:  64%|######4   | 61/95 [00:41<00:22,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8247, UAS: 0.8617, LAS: 0.7560, UEM: 0.3955, LEM: 0.1630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5772, partial_loss/deprel_loss: 0.9634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9498, loss: 1.6978, batch_reg_loss: 0.0636, reg_loss: 0.0638 ||:  68%|######8   | 65/95 [00:44<00:20,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6948, UAS: 0.8627, LAS: 0.7569, UEM: 0.4035, LEM: 0.1681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5275, partial_loss/deprel_loss: 2.4498, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5289, loss: 1.6927, batch_reg_loss: 0.0635, reg_loss: 0.0638 ||:  72%|#######1  | 68/95 [00:47<00:19,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8050, UAS: 0.8632, LAS: 0.7576, UEM: 0.3997, LEM: 0.1647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7576, partial_loss/deprel_loss: 1.1395, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1266, loss: 1.6848, batch_reg_loss: 0.0635, reg_loss: 0.0638 ||:  75%|#######4  | 71/95 [00:49<00:17,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8209, UAS: 0.8658, LAS: 0.7608, UEM: 0.4055, LEM: 0.1652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.9915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9802, loss: 1.6526, batch_reg_loss: 0.0635, reg_loss: 0.0638 ||:  79%|#######8  | 75/95 [00:52<00:14,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7611, UAS: 0.8631, LAS: 0.7583, UEM: 0.3988, LEM: 0.1623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3472, partial_loss/deprel_loss: 1.7179, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7072, loss: 1.6814, batch_reg_loss: 0.0635, reg_loss: 0.0638 ||:  82%|########2 | 78/95 [00:54<00:12,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8106, UAS: 0.8635, LAS: 0.7589, UEM: 0.3952, LEM: 0.1594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7722, partial_loss/deprel_loss: 1.0976, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0960, loss: 1.6750, batch_reg_loss: 0.0635, reg_loss: 0.0638 ||:  85%|########5 | 81/95 [00:56<00:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7472, UAS: 0.8634, LAS: 0.7587, UEM: 0.3876, LEM: 0.1554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4159, partial_loss/deprel_loss: 1.8051, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7907, loss: 1.6768, batch_reg_loss: 0.0634, reg_loss: 0.0637 ||:  88%|########8 | 84/95 [00:58<00:07,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8146, UAS: 0.8635, LAS: 0.7590, UEM: 0.3890, LEM: 0.1548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7390, partial_loss/deprel_loss: 1.1997, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1710, loss: 1.6739, batch_reg_loss: 0.0634, reg_loss: 0.0637 ||:  92%|#########1| 87/95 [01:00<00:05,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8351, UAS: 0.8644, LAS: 0.7604, UEM: 0.3879, LEM: 0.1527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5983, partial_loss/deprel_loss: 0.9408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9357, loss: 1.6605, batch_reg_loss: 0.0634, reg_loss: 0.0637 ||:  96%|#########5| 91/95 [01:03<00:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8429, UAS: 0.8655, LAS: 0.7616, UEM: 0.3865, LEM: 0.1504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5037, partial_loss/deprel_loss: 0.9392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9155, loss: 1.6492, batch_reg_loss: 0.0634, reg_loss: 0.0637 ||:  99%|#########8| 94/95 [01:05<00:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7393, UAS: 0.8654, LAS: 0.7613, UEM: 0.3842, LEM: 0.1492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3101, partial_loss/deprel_loss: 1.8342, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7927, loss: 1.6507, batch_reg_loss: 0.0634, reg_loss: 0.0637 ||: 100%|##########| 95/95 [01:05<00:00,  1.44it/s]\n",
+      "2023-04-06 22:56:25,630 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7846, UAS: 0.9080, LAS: 0.8175, UEM: 0.4009, LEM: 0.1300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2796, partial_loss/deprel_loss: 39.2859, partial_loss/cycle_loss: 0.0000, batch_loss: 31.6847, loss: 23.2949, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:07,  1.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8544, UAS: 0.9219, LAS: 0.8351, UEM: 0.5020, LEM: 0.1876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5392, partial_loss/deprel_loss: 25.7007, partial_loss/cycle_loss: 0.0000, batch_loss: 20.6684, loss: 21.8143, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  55%|#####4    | 6/11 [00:05<00:04,  1.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7895, UAS: 0.9238, LAS: 0.8396, UEM: 0.5798, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4669, partial_loss/deprel_loss: 43.6367, partial_loss/cycle_loss: 0.0000, batch_loss: 35.2028, loss: 22.2369, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  82%|########1 | 9/11 [00:08<00:01,  1.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7461, UAS: 0.9152, LAS: 0.8299, UEM: 0.5427, LEM: 0.2474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0760, partial_loss/deprel_loss: 51.1684, partial_loss/cycle_loss: 0.0000, batch_loss: 41.3499, loss: 23.5376, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.04it/s]\n",
+      "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.064  |     0.000\n",
+      "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - UEM                      |     0.384  |     0.543\n",
+      "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - LEM                      |     0.149  |     0.247\n",
+      "2023-04-06 22:56:36,165 - INFO - combo.training.tensorboard_writer - EM                       |     0.739  |     0.746\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.310  |     2.076\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - UAS                      |     0.865  |     0.915\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.834  |    51.168\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - loss                     |     1.651  |    23.538\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - LAS                      |     0.761  |     0.830\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.722  |       N/A\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 22:56:36,166 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 22:56:36,167 - INFO - combo.training.trainer - Epoch duration: 0:01:16.532214\n",
+      "2023-04-06 22:56:36,167 - INFO - combo.training.trainer - Estimated training time remaining: 7:39:37\n",
+      "2023-04-06 22:56:36,167 - INFO - allennlp.training.trainer - Epoch 6/399\n",
+      "2023-04-06 22:56:36,167 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 22:56:36,167 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:56:36,173 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8139, UAS: 0.8852, LAS: 0.7845, UEM: 0.4318, LEM: 0.1699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7961, partial_loss/deprel_loss: 1.2270, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2042, loss: 1.4337, batch_reg_loss: 0.0634, reg_loss: 0.0634 ||:   4%|4         | 4/95 [00:02<01:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7204, UAS: 0.8715, LAS: 0.7707, UEM: 0.3227, LEM: 0.1179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0650, partial_loss/deprel_loss: 2.0459, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1131, loss: 1.5804, batch_reg_loss: 0.0634, reg_loss: 0.0634 ||:   7%|7         | 7/95 [00:05<01:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8260, UAS: 0.8775, LAS: 0.7779, UEM: 0.3232, LEM: 0.1062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7638, partial_loss/deprel_loss: 1.1360, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1249, loss: 1.5147, batch_reg_loss: 0.0633, reg_loss: 0.0634 ||:  11%|#         | 10/95 [00:07<00:59,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7200, UAS: 0.8655, LAS: 0.7663, UEM: 0.3436, LEM: 0.1184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1232, partial_loss/deprel_loss: 2.0626, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1381, loss: 1.6473, batch_reg_loss: 0.0633, reg_loss: 0.0634 ||:  14%|#3        | 13/95 [00:09<01:00,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7778, UAS: 0.8593, LAS: 0.7603, UEM: 0.3078, LEM: 0.1035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3290, partial_loss/deprel_loss: 1.5895, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6007, loss: 1.7120, batch_reg_loss: 0.0633, reg_loss: 0.0634 ||:  17%|#6        | 16/95 [00:12<01:00,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6399, UAS: 0.8593, LAS: 0.7595, UEM: 0.3445, LEM: 0.1216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.1261, partial_loss/deprel_loss: 2.7053, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8528, loss: 1.7150, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  20%|##        | 19/95 [00:14<00:56,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7184, UAS: 0.8653, LAS: 0.7650, UEM: 0.3841, LEM: 0.1386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9814, partial_loss/deprel_loss: 2.0559, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1043, loss: 1.6599, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  23%|##3       | 22/95 [00:16<00:54,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8084, UAS: 0.8685, LAS: 0.7680, UEM: 0.3554, LEM: 0.1227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9110, partial_loss/deprel_loss: 1.3132, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2960, loss: 1.6295, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  27%|##7       | 26/95 [00:18<00:47,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8365, UAS: 0.8739, LAS: 0.7741, UEM: 0.3662, LEM: 0.1229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5057, partial_loss/deprel_loss: 0.9085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8912, loss: 1.5664, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  32%|###1      | 30/95 [00:21<00:44,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8551, UAS: 0.8775, LAS: 0.7785, UEM: 0.3891, LEM: 0.1362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3909, partial_loss/deprel_loss: 0.7925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7755, loss: 1.5217, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  35%|###4      | 33/95 [00:23<00:44,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7322, UAS: 0.8787, LAS: 0.7806, UEM: 0.4363, LEM: 0.1945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8153, partial_loss/deprel_loss: 1.9592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9937, loss: 1.5023, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  38%|###7      | 36/95 [00:25<00:43,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7980, UAS: 0.8798, LAS: 0.7821, UEM: 0.4186, LEM: 0.1809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9276, partial_loss/deprel_loss: 1.3685, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3436, loss: 1.4864, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  42%|####2     | 40/95 [00:28<00:37,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7367, UAS: 0.8780, LAS: 0.7800, UEM: 0.4028, LEM: 0.1734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7696, partial_loss/deprel_loss: 1.8948, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9331, loss: 1.5062, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  45%|####5     | 43/95 [00:30<00:35,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7507, UAS: 0.8786, LAS: 0.7810, UEM: 0.4198, LEM: 0.1913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5450, partial_loss/deprel_loss: 1.7539, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7754, loss: 1.4948, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  48%|####8     | 46/95 [00:32<00:34,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.8789, LAS: 0.7816, UEM: 0.4310, LEM: 0.1998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2861, partial_loss/deprel_loss: 0.6546, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6442, loss: 1.4886, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  53%|#####2    | 50/95 [00:35<00:31,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8275, UAS: 0.8791, LAS: 0.7819, UEM: 0.4291, LEM: 0.1987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5723, partial_loss/deprel_loss: 0.8703, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8740, loss: 1.4817, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  56%|#####5    | 53/95 [00:37<00:29,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8254, UAS: 0.8779, LAS: 0.7809, UEM: 0.4186, LEM: 0.1913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7167, partial_loss/deprel_loss: 1.0576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0527, loss: 1.4918, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  60%|######    | 57/95 [00:39<00:25,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8198, UAS: 0.8802, LAS: 0.7837, UEM: 0.4213, LEM: 0.1882, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7148, partial_loss/deprel_loss: 1.0188, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0213, loss: 1.4653, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  64%|######4   | 61/95 [00:42<00:22,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8187, UAS: 0.8810, LAS: 0.7847, UEM: 0.4127, LEM: 0.1803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6354, partial_loss/deprel_loss: 1.0926, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0645, loss: 1.4554, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  68%|######8   | 65/95 [00:45<00:20,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.8816, LAS: 0.7855, UEM: 0.4126, LEM: 0.1791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4871, partial_loss/deprel_loss: 0.9315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9059, loss: 1.4468, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  73%|#######2  | 69/95 [00:47<00:17,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7504, UAS: 0.8789, LAS: 0.7825, UEM: 0.4021, LEM: 0.1739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5896, partial_loss/deprel_loss: 1.8201, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8373, loss: 1.4763, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  77%|#######6  | 73/95 [00:50<00:14,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7718, UAS: 0.8752, LAS: 0.7785, UEM: 0.3939, LEM: 0.1699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2170, partial_loss/deprel_loss: 1.6286, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6096, loss: 1.5194, batch_reg_loss: 0.0633, reg_loss: 0.0633 ||:  81%|########1 | 77/95 [00:52<00:11,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7139, UAS: 0.8748, LAS: 0.7783, UEM: 0.3947, LEM: 0.1693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2148, partial_loss/deprel_loss: 2.2443, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3018, loss: 1.5257, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||:  85%|########5 | 81/95 [00:55<00:08,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8317, UAS: 0.8772, LAS: 0.7809, UEM: 0.4104, LEM: 0.1758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5189, partial_loss/deprel_loss: 0.9438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9222, loss: 1.4992, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||:  89%|########9 | 85/95 [00:58<00:06,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8445, UAS: 0.8758, LAS: 0.7795, UEM: 0.4091, LEM: 0.1736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5333, partial_loss/deprel_loss: 0.9501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9301, loss: 1.5140, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||:  93%|#########2| 88/95 [01:00<00:05,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7635, UAS: 0.8765, LAS: 0.7801, UEM: 0.4065, LEM: 0.1706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2404, partial_loss/deprel_loss: 1.7057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6761, loss: 1.5071, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||:  96%|#########5| 91/95 [01:03<00:02,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7174, UAS: 0.8776, LAS: 0.7814, UEM: 0.4107, LEM: 0.1699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1446, partial_loss/deprel_loss: 2.0900, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1643, loss: 1.4954, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||: 100%|##########| 95/95 [01:05<00:00,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7174, UAS: 0.8776, LAS: 0.7814, UEM: 0.4107, LEM: 0.1699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1446, partial_loss/deprel_loss: 2.0900, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1643, loss: 1.4954, batch_reg_loss: 0.0634, reg_loss: 0.0633 ||: 100%|##########| 95/95 [01:05<00:00,  1.44it/s]\n",
+      "2023-04-06 22:57:41,968 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:57:41,968 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.063  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - UEM                      |     0.411  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - LEM                      |     0.170  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - EM                       |     0.717  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     2.145  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - UAS                      |     0.878  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     2.090  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - loss                     |     1.495  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - LAS                      |     0.781  |       N/A\n",
+      "2023-04-06 22:57:41,969 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.907  |       N/A\n",
+      "2023-04-06 22:57:41,970 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:57:41,970 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:57:41,970 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:57:41,970 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:57:41,970 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:57:41,970 - INFO - combo.training.trainer - Epoch duration: 0:01:05.803367\n",
+      "2023-04-06 22:57:41,971 - INFO - combo.training.trainer - Estimated training time remaining: 7:34:32\n",
+      "2023-04-06 22:57:41,971 - INFO - allennlp.training.trainer - Epoch 7/399\n",
+      "2023-04-06 22:57:41,971 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 22:57:41,971 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:57:41,978 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7544, UAS: 0.8492, LAS: 0.7522, UEM: 0.0364, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5982, partial_loss/deprel_loss: 1.6971, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7408, loss: 1.7857, batch_reg_loss: 0.0634, reg_loss: 0.0634 ||:   3%|3         | 3/95 [00:02<01:01,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8092, UAS: 0.8525, LAS: 0.7608, UEM: 0.2493, LEM: 0.0764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9619, partial_loss/deprel_loss: 1.2887, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2868, loss: 1.7437, batch_reg_loss: 0.0634, reg_loss: 0.0634 ||:   6%|6         | 6/95 [00:04<01:01,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8765, UAS: 0.8710, LAS: 0.7817, UEM: 0.5237, LEM: 0.2864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2644, partial_loss/deprel_loss: 0.5426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5504, loss: 1.5241, batch_reg_loss: 0.0635, reg_loss: 0.0634 ||:   9%|9         | 9/95 [00:06<01:02,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8522, UAS: 0.8785, LAS: 0.7900, UEM: 0.5429, LEM: 0.2839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4888, partial_loss/deprel_loss: 0.8685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8561, loss: 1.4643, batch_reg_loss: 0.0635, reg_loss: 0.0634 ||:  13%|#2        | 12/95 [00:08<01:01,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7300, UAS: 0.8770, LAS: 0.7874, UEM: 0.5009, LEM: 0.2479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7910, partial_loss/deprel_loss: 1.8718, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9192, loss: 1.4855, batch_reg_loss: 0.0635, reg_loss: 0.0635 ||:  17%|#6        | 16/95 [00:11<00:53,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.8833, LAS: 0.7951, UEM: 0.5561, LEM: 0.3169, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1348, partial_loss/deprel_loss: 0.3689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3856, loss: 1.4103, batch_reg_loss: 0.0635, reg_loss: 0.0635 ||:  21%|##1       | 20/95 [00:13<00:50,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7715, UAS: 0.8874, LAS: 0.7989, UEM: 0.5485, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2845, partial_loss/deprel_loss: 1.6086, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6074, loss: 1.3682, batch_reg_loss: 0.0635, reg_loss: 0.0635 ||:  25%|##5       | 24/95 [00:16<00:45,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7687, UAS: 0.8862, LAS: 0.7975, UEM: 0.5455, LEM: 0.2957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2891, partial_loss/deprel_loss: 1.5481, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5598, loss: 1.3750, batch_reg_loss: 0.0636, reg_loss: 0.0635 ||:  29%|##9       | 28/95 [00:18<00:43,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7934, UAS: 0.8880, LAS: 0.7994, UEM: 0.5226, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0129, partial_loss/deprel_loss: 1.4350, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4142, loss: 1.3573, batch_reg_loss: 0.0636, reg_loss: 0.0635 ||:  34%|###3      | 32/95 [00:20<00:38,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8348, UAS: 0.8865, LAS: 0.7973, UEM: 0.5038, LEM: 0.2591, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7337, partial_loss/deprel_loss: 1.0537, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0533, loss: 1.3775, batch_reg_loss: 0.0636, reg_loss: 0.0635 ||:  38%|###7      | 36/95 [00:23<00:37,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7901, UAS: 0.8859, LAS: 0.7964, UEM: 0.4948, LEM: 0.2505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1651, partial_loss/deprel_loss: 1.4327, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4428, loss: 1.3839, batch_reg_loss: 0.0636, reg_loss: 0.0635 ||:  42%|####2     | 40/95 [00:26<00:36,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.8884, LAS: 0.7995, UEM: 0.4954, LEM: 0.2445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4473, partial_loss/deprel_loss: 0.8673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8470, loss: 1.3582, batch_reg_loss: 0.0636, reg_loss: 0.0635 ||:  46%|####6     | 44/95 [00:28<00:32,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8306, UAS: 0.8885, LAS: 0.7994, UEM: 0.4912, LEM: 0.2366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7249, partial_loss/deprel_loss: 1.0650, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0607, loss: 1.3584, batch_reg_loss: 0.0637, reg_loss: 0.0635 ||:  51%|#####     | 48/95 [00:31<00:31,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7623, UAS: 0.8889, LAS: 0.7999, UEM: 0.4876, LEM: 0.2336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5943, partial_loss/deprel_loss: 1.6767, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7239, loss: 1.3541, batch_reg_loss: 0.0637, reg_loss: 0.0636 ||:  55%|#####4    | 52/95 [00:34<00:27,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8502, UAS: 0.8912, LAS: 0.8026, UEM: 0.4893, LEM: 0.2298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4612, partial_loss/deprel_loss: 0.7483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7546, loss: 1.3281, batch_reg_loss: 0.0637, reg_loss: 0.0636 ||:  59%|#####8    | 56/95 [00:36<00:25,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8561, UAS: 0.8917, LAS: 0.8028, UEM: 0.4824, LEM: 0.2238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4378, partial_loss/deprel_loss: 0.8147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8031, loss: 1.3214, batch_reg_loss: 0.0637, reg_loss: 0.0636 ||:  63%|######3   | 60/95 [00:39<00:23,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8393, UAS: 0.8922, LAS: 0.8035, UEM: 0.4789, LEM: 0.2181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5806, partial_loss/deprel_loss: 1.0386, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0107, loss: 1.3139, batch_reg_loss: 0.0638, reg_loss: 0.0636 ||:  67%|######7   | 64/95 [00:42<00:20,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8331, UAS: 0.8920, LAS: 0.8032, UEM: 0.4758, LEM: 0.2142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6390, partial_loss/deprel_loss: 1.0286, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0145, loss: 1.3176, batch_reg_loss: 0.0638, reg_loss: 0.0636 ||:  72%|#######1  | 68/95 [00:44<00:17,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8204, UAS: 0.8900, LAS: 0.8012, UEM: 0.4661, LEM: 0.2089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9543, partial_loss/deprel_loss: 1.2122, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2244, loss: 1.3393, batch_reg_loss: 0.0638, reg_loss: 0.0636 ||:  76%|#######5  | 72/95 [00:46<00:14,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7939, UAS: 0.8907, LAS: 0.8018, UEM: 0.4598, LEM: 0.2040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2010, partial_loss/deprel_loss: 1.5187, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5190, loss: 1.3337, batch_reg_loss: 0.0638, reg_loss: 0.0636 ||:  80%|########  | 76/95 [00:49<00:12,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8152, UAS: 0.8885, LAS: 0.7995, UEM: 0.4531, LEM: 0.1996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9159, partial_loss/deprel_loss: 1.2435, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2418, loss: 1.3594, batch_reg_loss: 0.0639, reg_loss: 0.0636 ||:  84%|########4 | 80/95 [00:52<00:09,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7586, UAS: 0.8867, LAS: 0.7973, UEM: 0.4429, LEM: 0.1946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4134, partial_loss/deprel_loss: 1.8125, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7965, loss: 1.3824, batch_reg_loss: 0.0639, reg_loss: 0.0636 ||:  88%|########8 | 84/95 [00:55<00:07,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8012, UAS: 0.8867, LAS: 0.7972, UEM: 0.4449, LEM: 0.1972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1268, partial_loss/deprel_loss: 1.3129, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3396, loss: 1.3818, batch_reg_loss: 0.0639, reg_loss: 0.0637 ||:  93%|#########2| 88/95 [00:58<00:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7951, UAS: 0.8871, LAS: 0.7972, UEM: 0.4409, LEM: 0.1933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9967, partial_loss/deprel_loss: 1.4019, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3849, loss: 1.3799, batch_reg_loss: 0.0640, reg_loss: 0.0637 ||:  96%|#########5| 91/95 [01:00<00:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8224, UAS: 0.8875, LAS: 0.7973, UEM: 0.4360, LEM: 0.1894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8249, partial_loss/deprel_loss: 1.0910, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1018, loss: 1.3791, batch_reg_loss: 0.0640, reg_loss: 0.0637 ||:  99%|#########8| 94/95 [01:02<00:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7707, UAS: 0.8873, LAS: 0.7970, UEM: 0.4336, LEM: 0.1881, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2738, partial_loss/deprel_loss: 1.5326, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5448, loss: 1.3809, batch_reg_loss: 0.0640, reg_loss: 0.0637 ||: 100%|##########| 95/95 [01:03<00:00,  1.50it/s]\n",
+      "2023-04-06 22:58:45,366 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.064  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - UEM                      |     0.434  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - LEM                      |     0.188  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - EM                       |     0.771  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.274  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - UAS                      |     0.887  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.533  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - loss                     |     1.381  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:58:45,367 - INFO - combo.training.tensorboard_writer - LAS                      |     0.797  |       N/A\n",
+      "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.907  |       N/A\n",
+      "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:58:45,368 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:58:45,368 - INFO - combo.training.trainer - Epoch duration: 0:01:03.397784\n",
+      "2023-04-06 22:58:45,369 - INFO - combo.training.trainer - Estimated training time remaining: 7:28:29\n",
+      "2023-04-06 22:58:45,369 - INFO - allennlp.training.trainer - Epoch 8/399\n",
+      "2023-04-06 22:58:45,369 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 22:58:45,369 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:58:45,375 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7960, UAS: 0.8766, LAS: 0.7884, UEM: 0.0867, LEM: 0.0186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1714, partial_loss/deprel_loss: 1.4375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4483, loss: 1.5283, batch_reg_loss: 0.0641, reg_loss: 0.0641 ||:   3%|3         | 3/95 [00:02<01:01,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.8879, LAS: 0.7993, UEM: 0.2805, LEM: 0.0809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5547, partial_loss/deprel_loss: 0.9722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9528, loss: 1.3837, batch_reg_loss: 0.0641, reg_loss: 0.0641 ||:   7%|7         | 7/95 [00:04<00:58,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.8982, LAS: 0.8128, UEM: 0.3722, LEM: 0.1342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6149, partial_loss/deprel_loss: 0.9548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9510, loss: 1.2616, batch_reg_loss: 0.0642, reg_loss: 0.0641 ||:  13%|#2        | 12/95 [00:06<00:49,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8342, UAS: 0.8925, LAS: 0.8064, UEM: 0.3546, LEM: 0.1231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6295, partial_loss/deprel_loss: 0.9856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9785, loss: 1.3014, batch_reg_loss: 0.0642, reg_loss: 0.0641 ||:  16%|#5        | 15/95 [00:09<00:52,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7982, UAS: 0.8977, LAS: 0.8115, UEM: 0.3777, LEM: 0.1298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8726, partial_loss/deprel_loss: 1.2775, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2607, loss: 1.2535, batch_reg_loss: 0.0642, reg_loss: 0.0641 ||:  19%|#8        | 18/95 [00:11<00:53,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7925, UAS: 0.8982, LAS: 0.8117, UEM: 0.3924, LEM: 0.1437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1242, partial_loss/deprel_loss: 1.4479, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4473, loss: 1.2433, batch_reg_loss: 0.0642, reg_loss: 0.0641 ||:  22%|##2       | 21/95 [00:13<00:52,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7558, UAS: 0.8948, LAS: 0.8080, UEM: 0.3640, LEM: 0.1318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7870, partial_loss/deprel_loss: 1.7873, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8515, loss: 1.2800, batch_reg_loss: 0.0643, reg_loss: 0.0642 ||:  26%|##6       | 25/95 [00:15<00:46,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8093, UAS: 0.8991, LAS: 0.8129, UEM: 0.4093, LEM: 0.1608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9189, partial_loss/deprel_loss: 1.2039, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2112, loss: 1.2355, batch_reg_loss: 0.0643, reg_loss: 0.0642 ||:  29%|##9       | 28/95 [00:18<00:45,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8276, UAS: 0.9023, LAS: 0.8164, UEM: 0.4421, LEM: 0.1855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7983, partial_loss/deprel_loss: 1.0589, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0711, loss: 1.1956, batch_reg_loss: 0.0643, reg_loss: 0.0642 ||:  33%|###2      | 31/95 [00:20<00:45,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8526, UAS: 0.8993, LAS: 0.8138, UEM: 0.4486, LEM: 0.1915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4474, partial_loss/deprel_loss: 0.7212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7308, loss: 1.2169, batch_reg_loss: 0.0643, reg_loss: 0.0642 ||:  36%|###5      | 34/95 [00:22<00:45,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8529, UAS: 0.8992, LAS: 0.8139, UEM: 0.4544, LEM: 0.1922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4838, partial_loss/deprel_loss: 0.8630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8515, loss: 1.2150, batch_reg_loss: 0.0643, reg_loss: 0.0642 ||:  40%|####      | 38/95 [00:25<00:41,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8091, UAS: 0.8998, LAS: 0.8147, UEM: 0.4529, LEM: 0.1911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1905, partial_loss/deprel_loss: 1.3851, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4105, loss: 1.2106, batch_reg_loss: 0.0644, reg_loss: 0.0642 ||:  43%|####3     | 41/95 [00:27<00:38,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8411, UAS: 0.8994, LAS: 0.8142, UEM: 0.4556, LEM: 0.1896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5881, partial_loss/deprel_loss: 0.9996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9817, loss: 1.2179, batch_reg_loss: 0.0644, reg_loss: 0.0642 ||:  47%|####7     | 45/95 [00:30<00:33,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8386, UAS: 0.8983, LAS: 0.8123, UEM: 0.4424, LEM: 0.1808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6947, partial_loss/deprel_loss: 1.0266, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0247, loss: 1.2359, batch_reg_loss: 0.0644, reg_loss: 0.0642 ||:  52%|#####1    | 49/95 [00:32<00:30,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7533, UAS: 0.8985, LAS: 0.8127, UEM: 0.4414, LEM: 0.1795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5425, partial_loss/deprel_loss: 1.5829, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6393, loss: 1.2254, batch_reg_loss: 0.0645, reg_loss: 0.0643 ||:  56%|#####5    | 53/95 [00:35<00:27,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7877, UAS: 0.8973, LAS: 0.8112, UEM: 0.4319, LEM: 0.1743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3386, partial_loss/deprel_loss: 1.4528, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4945, loss: 1.2410, batch_reg_loss: 0.0645, reg_loss: 0.0643 ||:  60%|######    | 57/95 [00:38<00:25,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8630, UAS: 0.8975, LAS: 0.8113, UEM: 0.4308, LEM: 0.1737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3600, partial_loss/deprel_loss: 0.7389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7277, loss: 1.2418, batch_reg_loss: 0.0646, reg_loss: 0.0643 ||:  64%|######4   | 61/95 [00:40<00:22,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8689, UAS: 0.8972, LAS: 0.8109, UEM: 0.4285, LEM: 0.1730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3648, partial_loss/deprel_loss: 0.7674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7515, loss: 1.2476, batch_reg_loss: 0.0646, reg_loss: 0.0643 ||:  68%|######8   | 65/95 [00:42<00:19,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.8979, LAS: 0.8122, UEM: 0.4507, LEM: 0.1927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2452, partial_loss/deprel_loss: 0.5030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5161, loss: 1.2376, batch_reg_loss: 0.0647, reg_loss: 0.0643 ||:  73%|#######2  | 69/95 [00:45<00:17,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7070, UAS: 0.8969, LAS: 0.8110, UEM: 0.4422, LEM: 0.1873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3662, partial_loss/deprel_loss: 2.1813, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2830, loss: 1.2500, batch_reg_loss: 0.0647, reg_loss: 0.0644 ||:  77%|#######6  | 73/95 [00:48<00:14,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8308, UAS: 0.8951, LAS: 0.8090, UEM: 0.4329, LEM: 0.1828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7761, partial_loss/deprel_loss: 1.0307, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0446, loss: 1.2678, batch_reg_loss: 0.0648, reg_loss: 0.0644 ||:  81%|########1 | 77/95 [00:51<00:11,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.8959, LAS: 0.8101, UEM: 0.4385, LEM: 0.1888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7951, partial_loss/deprel_loss: 1.1140, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1150, loss: 1.2612, batch_reg_loss: 0.0648, reg_loss: 0.0644 ||:  85%|########5 | 81/95 [00:54<00:09,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8287, UAS: 0.8950, LAS: 0.8088, UEM: 0.4376, LEM: 0.1864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8267, partial_loss/deprel_loss: 1.1303, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1344, loss: 1.2756, batch_reg_loss: 0.0649, reg_loss: 0.0644 ||:  89%|########9 | 85/95 [00:56<00:06,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8440, UAS: 0.8945, LAS: 0.8085, UEM: 0.4560, LEM: 0.2097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6894, partial_loss/deprel_loss: 0.9977, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0009, loss: 1.2818, batch_reg_loss: 0.0649, reg_loss: 0.0644 ||:  94%|#########3| 89/95 [00:59<00:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8309, UAS: 0.8938, LAS: 0.8077, UEM: 0.4470, LEM: 0.2044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8120, partial_loss/deprel_loss: 1.0731, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0858, loss: 1.2908, batch_reg_loss: 0.0650, reg_loss: 0.0645 ||:  98%|#########7| 93/95 [01:01<00:01,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7516, UAS: 0.8926, LAS: 0.8065, UEM: 0.4427, LEM: 0.2025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7706, partial_loss/deprel_loss: 1.7483, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8177, loss: 1.3028, batch_reg_loss: 0.0650, reg_loss: 0.0645 ||: 100%|##########| 95/95 [01:03<00:00,  1.50it/s]\n",
+      "2023-04-06 22:59:48,520 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.064  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - UEM                      |     0.443  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - LEM                      |     0.202  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - EM                       |     0.752  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.771  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - UAS                      |     0.893  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.748  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - loss                     |     1.303  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:59:48,521 - INFO - combo.training.tensorboard_writer - LAS                      |     0.806  |       N/A\n",
+      "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.907  |       N/A\n",
+      "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:59:48,522 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:59:48,522 - INFO - combo.training.trainer - Epoch duration: 0:01:03.153713\n",
+      "2023-04-06 22:59:48,522 - INFO - combo.training.trainer - Estimated training time remaining: 7:23:22\n",
+      "2023-04-06 22:59:48,522 - INFO - allennlp.training.trainer - Epoch 9/399\n",
+      "2023-04-06 22:59:48,523 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 22:59:48,523 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:59:48,529 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9012, LAS: 0.8183, UEM: 0.3259, LEM: 0.1007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6332, partial_loss/deprel_loss: 0.8460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8685, loss: 1.2115, batch_reg_loss: 0.0650, reg_loss: 0.0650 ||:   4%|4         | 4/95 [00:02<00:49,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8063, UAS: 0.9085, LAS: 0.8263, UEM: 0.4017, LEM: 0.1348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1179, partial_loss/deprel_loss: 1.2629, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2989, loss: 1.1239, batch_reg_loss: 0.0651, reg_loss: 0.0650 ||:   7%|7         | 7/95 [00:04<00:53,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8399, UAS: 0.8992, LAS: 0.8168, UEM: 0.3929, LEM: 0.1274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7859, partial_loss/deprel_loss: 0.9736, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0012, loss: 1.2177, batch_reg_loss: 0.0651, reg_loss: 0.0651 ||:  11%|#         | 10/95 [00:06<00:55,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7336, UAS: 0.8973, LAS: 0.8147, UEM: 0.3889, LEM: 0.1248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3379, partial_loss/deprel_loss: 1.8283, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9954, loss: 1.2410, batch_reg_loss: 0.0652, reg_loss: 0.0651 ||:  14%|#3        | 13/95 [00:08<00:55,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.8937, LAS: 0.8107, UEM: 0.3964, LEM: 0.1369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3987, partial_loss/deprel_loss: 0.7168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7184, loss: 1.2798, batch_reg_loss: 0.0652, reg_loss: 0.0651 ||:  17%|#6        | 16/95 [00:10<00:53,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7957, UAS: 0.8909, LAS: 0.8065, UEM: 0.3515, LEM: 0.1187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2395, partial_loss/deprel_loss: 1.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4966, loss: 1.3237, batch_reg_loss: 0.0653, reg_loss: 0.0651 ||:  21%|##1       | 20/95 [00:13<00:50,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.8905, LAS: 0.8061, UEM: 0.3490, LEM: 0.1206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4946, partial_loss/deprel_loss: 0.7930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7986, loss: 1.3368, batch_reg_loss: 0.0653, reg_loss: 0.0652 ||:  25%|##5       | 24/95 [00:16<00:48,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7865, UAS: 0.8863, LAS: 0.8018, UEM: 0.3213, LEM: 0.1094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5779, partial_loss/deprel_loss: 1.6368, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6904, loss: 1.3790, batch_reg_loss: 0.0654, reg_loss: 0.0652 ||:  29%|##9       | 28/95 [00:18<00:44,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7985, UAS: 0.8878, LAS: 0.8028, UEM: 0.3248, LEM: 0.1124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9806, partial_loss/deprel_loss: 1.4104, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3899, loss: 1.3691, batch_reg_loss: 0.0654, reg_loss: 0.0652 ||:  33%|###2      | 31/95 [00:21<00:43,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8694, UAS: 0.8900, LAS: 0.8052, UEM: 0.3452, LEM: 0.1243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3102, partial_loss/deprel_loss: 0.6592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6549, loss: 1.3427, batch_reg_loss: 0.0655, reg_loss: 0.0652 ||:  37%|###6      | 35/95 [00:23<00:40,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7492, UAS: 0.8914, LAS: 0.8071, UEM: 0.3706, LEM: 0.1420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7194, partial_loss/deprel_loss: 1.7316, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7946, loss: 1.3227, batch_reg_loss: 0.0655, reg_loss: 0.0652 ||:  40%|####      | 38/95 [00:25<00:39,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7134, UAS: 0.8890, LAS: 0.8047, UEM: 0.3838, LEM: 0.1508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8345, partial_loss/deprel_loss: 2.2025, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3944, loss: 1.3478, batch_reg_loss: 0.0656, reg_loss: 0.0653 ||:  43%|####3     | 41/95 [00:27<00:37,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8218, UAS: 0.8897, LAS: 0.8053, UEM: 0.3825, LEM: 0.1483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8915, partial_loss/deprel_loss: 1.1250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1439, loss: 1.3414, batch_reg_loss: 0.0656, reg_loss: 0.0653 ||:  46%|####6     | 44/95 [00:30<00:35,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.8897, LAS: 0.8056, UEM: 0.3805, LEM: 0.1461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4738, partial_loss/deprel_loss: 0.8436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8353, loss: 1.3372, batch_reg_loss: 0.0657, reg_loss: 0.0653 ||:  51%|#####     | 48/95 [00:32<00:31,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8498, UAS: 0.8916, LAS: 0.8080, UEM: 0.3958, LEM: 0.1551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5700, partial_loss/deprel_loss: 0.9175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9137, loss: 1.3151, batch_reg_loss: 0.0657, reg_loss: 0.0653 ||:  54%|#####3    | 51/95 [00:34<00:29,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7952, UAS: 0.8923, LAS: 0.8088, UEM: 0.3921, LEM: 0.1524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2080, partial_loss/deprel_loss: 1.3800, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4113, loss: 1.3055, batch_reg_loss: 0.0658, reg_loss: 0.0654 ||:  57%|#####6    | 54/95 [00:36<00:28,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.8919, LAS: 0.8083, UEM: 0.3842, LEM: 0.1482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7063, partial_loss/deprel_loss: 0.9721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9848, loss: 1.3098, batch_reg_loss: 0.0658, reg_loss: 0.0654 ||:  60%|######    | 57/95 [00:38<00:26,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8125, UAS: 0.8930, LAS: 0.8092, UEM: 0.3777, LEM: 0.1422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9309, partial_loss/deprel_loss: 1.2323, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2379, loss: 1.3015, batch_reg_loss: 0.0659, reg_loss: 0.0654 ||:  64%|######4   | 61/95 [00:41<00:22,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8311, UAS: 0.8943, LAS: 0.8108, UEM: 0.3858, LEM: 0.1472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8321, partial_loss/deprel_loss: 1.1460, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1492, loss: 1.2876, batch_reg_loss: 0.0659, reg_loss: 0.0654 ||:  67%|######7   | 64/95 [00:43<00:20,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8163, UAS: 0.8929, LAS: 0.8095, UEM: 0.3785, LEM: 0.1434, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9436, partial_loss/deprel_loss: 1.1526, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1768, loss: 1.2997, batch_reg_loss: 0.0660, reg_loss: 0.0655 ||:  71%|#######   | 67/95 [00:45<00:19,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8328, UAS: 0.8940, LAS: 0.8105, UEM: 0.3968, LEM: 0.1612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7408, partial_loss/deprel_loss: 1.0109, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0229, loss: 1.2885, batch_reg_loss: 0.0661, reg_loss: 0.0655 ||:  75%|#######4  | 71/95 [00:48<00:16,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.8952, LAS: 0.8120, UEM: 0.4145, LEM: 0.1751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4338, partial_loss/deprel_loss: 0.7239, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7320, loss: 1.2735, batch_reg_loss: 0.0661, reg_loss: 0.0655 ||:  78%|#######7  | 74/95 [00:50<00:14,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6697, UAS: 0.8933, LAS: 0.8103, UEM: 0.4239, LEM: 0.1847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4333, partial_loss/deprel_loss: 2.4425, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7068, loss: 1.2919, batch_reg_loss: 0.0662, reg_loss: 0.0655 ||:  81%|########1 | 77/95 [00:52<00:12,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.8938, LAS: 0.8106, UEM: 0.4234, LEM: 0.1836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4158, partial_loss/deprel_loss: 0.7884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7801, loss: 1.2873, batch_reg_loss: 0.0662, reg_loss: 0.0656 ||:  84%|########4 | 80/95 [00:54<00:10,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8292, UAS: 0.8952, LAS: 0.8125, UEM: 0.4462, LEM: 0.2108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8022, partial_loss/deprel_loss: 1.0705, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0831, loss: 1.2711, batch_reg_loss: 0.0663, reg_loss: 0.0656 ||:  87%|########7 | 83/95 [00:57<00:08,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7990, UAS: 0.8952, LAS: 0.8127, UEM: 0.4400, LEM: 0.2055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1483, partial_loss/deprel_loss: 1.3003, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3363, loss: 1.2698, batch_reg_loss: 0.0663, reg_loss: 0.0656 ||:  92%|#########1| 87/95 [00:59<00:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.8966, LAS: 0.8144, UEM: 0.4516, LEM: 0.2121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4225, partial_loss/deprel_loss: 0.7426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7450, loss: 1.2534, batch_reg_loss: 0.0664, reg_loss: 0.0657 ||:  95%|#########4| 90/95 [01:01<00:03,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.8979, LAS: 0.8161, UEM: 0.4584, LEM: 0.2137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6116, partial_loss/deprel_loss: 0.9072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9145, loss: 1.2385, batch_reg_loss: 0.0664, reg_loss: 0.0657 ||:  98%|#########7| 93/95 [01:04<00:01,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.8987, LAS: 0.8170, UEM: 0.4618, LEM: 0.2129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4434, partial_loss/deprel_loss: 0.7938, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7901, loss: 1.2303, batch_reg_loss: 0.0664, reg_loss: 0.0657 ||: 100%|##########| 95/95 [01:06<00:00,  1.44it/s]\n",
+      "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.066  |       N/A\n",
+      "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:00:54,602 - INFO - combo.training.tensorboard_writer - UEM                      |     0.462  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - LEM                      |     0.213  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - EM                       |     0.871  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.443  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - UAS                      |     0.899  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.794  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - loss                     |     1.230  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - LAS                      |     0.817  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.907  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:00:54,603 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:00:54,604 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:00:54,604 - INFO - combo.training.trainer - Epoch duration: 0:01:06.081709\n",
+      "2023-04-06 23:00:54,604 - INFO - combo.training.trainer - Estimated training time remaining: 7:20:57\n",
+      "2023-04-06 23:00:54,604 - INFO - allennlp.training.trainer - Epoch 10/399\n",
+      "2023-04-06 23:00:54,605 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:00:54,605 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:00:54,611 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7031, UAS: 0.8218, LAS: 0.7323, UEM: 0.0305, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5298, partial_loss/deprel_loss: 2.0268, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1939, loss: 1.9374, batch_reg_loss: 0.0665, reg_loss: 0.0665 ||:   3%|3         | 3/95 [00:02<01:03,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.8586, LAS: 0.7740, UEM: 0.3208, LEM: 0.1694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2965, partial_loss/deprel_loss: 1.2639, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3370, loss: 1.5704, batch_reg_loss: 0.0665, reg_loss: 0.0665 ||:   6%|6         | 6/95 [00:04<01:02,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8118, UAS: 0.8798, LAS: 0.7985, UEM: 0.4239, LEM: 0.1836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0467, partial_loss/deprel_loss: 1.1728, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2142, loss: 1.3446, batch_reg_loss: 0.0666, reg_loss: 0.0665 ||:   9%|9         | 9/95 [00:06<01:03,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.8914, LAS: 0.8105, UEM: 0.4657, LEM: 0.2098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6000, partial_loss/deprel_loss: 0.8910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8994, loss: 1.2475, batch_reg_loss: 0.0666, reg_loss: 0.0665 ||:  13%|#2        | 12/95 [00:09<01:02,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7631, UAS: 0.8833, LAS: 0.8005, UEM: 0.4205, LEM: 0.1888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6921, partial_loss/deprel_loss: 1.6346, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7128, loss: 1.3505, batch_reg_loss: 0.0667, reg_loss: 0.0666 ||:  16%|#5        | 15/95 [00:11<00:59,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7271, UAS: 0.8819, LAS: 0.7994, UEM: 0.3897, LEM: 0.1691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5832, partial_loss/deprel_loss: 2.1145, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2749, loss: 1.3850, batch_reg_loss: 0.0667, reg_loss: 0.0666 ||:  19%|#8        | 18/95 [00:13<00:56,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8399, UAS: 0.8877, LAS: 0.8062, UEM: 0.4351, LEM: 0.2032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7033, partial_loss/deprel_loss: 0.9579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9737, loss: 1.3229, batch_reg_loss: 0.0668, reg_loss: 0.0666 ||:  22%|##2       | 21/95 [00:15<00:53,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8016, UAS: 0.8911, LAS: 0.8099, UEM: 0.4368, LEM: 0.2001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0288, partial_loss/deprel_loss: 1.3583, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3592, loss: 1.2861, batch_reg_loss: 0.0668, reg_loss: 0.0666 ||:  25%|##5       | 24/95 [00:17<00:52,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8398, UAS: 0.8934, LAS: 0.8121, UEM: 0.4386, LEM: 0.1962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7464, partial_loss/deprel_loss: 1.0831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0827, loss: 1.2714, batch_reg_loss: 0.0669, reg_loss: 0.0667 ||:  28%|##8       | 27/95 [00:19<00:49,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.8953, LAS: 0.8150, UEM: 0.4853, LEM: 0.2418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2152, partial_loss/deprel_loss: 0.4133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4406, loss: 1.2412, batch_reg_loss: 0.0669, reg_loss: 0.0667 ||:  32%|###1      | 30/95 [00:22<00:46,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8608, UAS: 0.8960, LAS: 0.8154, UEM: 0.4780, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5071, partial_loss/deprel_loss: 0.8553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8526, loss: 1.2423, batch_reg_loss: 0.0670, reg_loss: 0.0667 ||:  36%|###5      | 34/95 [00:25<00:44,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.8996, LAS: 0.8191, UEM: 0.4871, LEM: 0.2348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4258, partial_loss/deprel_loss: 0.7316, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7375, loss: 1.2090, batch_reg_loss: 0.0670, reg_loss: 0.0667 ||:  40%|####      | 38/95 [00:27<00:39,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.8994, LAS: 0.8188, UEM: 0.4778, LEM: 0.2275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6680, partial_loss/deprel_loss: 0.9297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9444, loss: 1.2127, batch_reg_loss: 0.0671, reg_loss: 0.0668 ||:  43%|####3     | 41/95 [00:29<00:39,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7881, UAS: 0.8999, LAS: 0.8193, UEM: 0.4624, LEM: 0.2162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4983, partial_loss/deprel_loss: 1.5294, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5904, loss: 1.2083, batch_reg_loss: 0.0672, reg_loss: 0.0668 ||:  47%|####7     | 45/95 [00:32<00:35,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7780, UAS: 0.9007, LAS: 0.8201, UEM: 0.4617, LEM: 0.2117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4568, partial_loss/deprel_loss: 1.5623, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6084, loss: 1.2016, batch_reg_loss: 0.0672, reg_loss: 0.0668 ||:  51%|#####     | 48/95 [00:34<00:33,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7926, UAS: 0.9010, LAS: 0.8206, UEM: 0.4518, LEM: 0.2046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2942, partial_loss/deprel_loss: 1.3307, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3907, loss: 1.1957, batch_reg_loss: 0.0673, reg_loss: 0.0669 ||:  55%|#####4    | 52/95 [00:37<00:29,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.8989, LAS: 0.8185, UEM: 0.4463, LEM: 0.2011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5744, partial_loss/deprel_loss: 0.7947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8179, loss: 1.2127, batch_reg_loss: 0.0673, reg_loss: 0.0669 ||:  59%|#####8    | 56/95 [00:39<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8376, UAS: 0.9001, LAS: 0.8200, UEM: 0.4409, LEM: 0.1938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7566, partial_loss/deprel_loss: 1.0446, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0544, loss: 1.2014, batch_reg_loss: 0.0674, reg_loss: 0.0669 ||:  63%|######3   | 60/95 [00:41<00:22,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8630, UAS: 0.9013, LAS: 0.8216, UEM: 0.4710, LEM: 0.2292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4239, partial_loss/deprel_loss: 0.7125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7222, loss: 1.1868, batch_reg_loss: 0.0675, reg_loss: 0.0670 ||:  67%|######7   | 64/95 [00:45<00:21,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7727, UAS: 0.9012, LAS: 0.8212, UEM: 0.4776, LEM: 0.2361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4438, partial_loss/deprel_loss: 1.4439, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5114, loss: 1.1869, batch_reg_loss: 0.0675, reg_loss: 0.0670 ||:  71%|#######   | 67/95 [00:47<00:19,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8169, UAS: 0.9016, LAS: 0.8213, UEM: 0.4723, LEM: 0.2304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8432, partial_loss/deprel_loss: 1.1341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1435, loss: 1.1835, batch_reg_loss: 0.0675, reg_loss: 0.0670 ||:  74%|#######3  | 70/95 [00:49<00:17,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6733, UAS: 0.9001, LAS: 0.8197, UEM: 0.4714, LEM: 0.2294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2788, partial_loss/deprel_loss: 2.4155, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6558, loss: 1.2007, batch_reg_loss: 0.0676, reg_loss: 0.0670 ||:  77%|#######6  | 73/95 [00:51<00:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8649, UAS: 0.9007, LAS: 0.8207, UEM: 0.4757, LEM: 0.2318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4996, partial_loss/deprel_loss: 0.8426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8417, loss: 1.1912, batch_reg_loss: 0.0676, reg_loss: 0.0671 ||:  80%|########  | 76/95 [00:54<00:13,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8503, UAS: 0.9007, LAS: 0.8207, UEM: 0.4681, LEM: 0.2252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7483, partial_loss/deprel_loss: 0.9126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9475, loss: 1.1914, batch_reg_loss: 0.0677, reg_loss: 0.0671 ||:  84%|########4 | 80/95 [00:56<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7666, UAS: 0.9010, LAS: 0.8212, UEM: 0.4685, LEM: 0.2241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8265, partial_loss/deprel_loss: 1.6867, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7824, loss: 1.1903, batch_reg_loss: 0.0678, reg_loss: 0.0671 ||:  88%|########8 | 84/95 [00:59<00:07,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9010, LAS: 0.8213, UEM: 0.4681, LEM: 0.2237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7418, partial_loss/deprel_loss: 1.0076, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0223, loss: 1.1896, batch_reg_loss: 0.0678, reg_loss: 0.0671 ||:  92%|#########1| 87/95 [01:01<00:05,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8071, UAS: 0.9017, LAS: 0.8221, UEM: 0.4660, LEM: 0.2202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1855, partial_loss/deprel_loss: 1.3873, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4148, loss: 1.1838, batch_reg_loss: 0.0679, reg_loss: 0.0672 ||:  96%|#########5| 91/95 [01:04<00:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7212, UAS: 0.9013, LAS: 0.8217, UEM: 0.4694, LEM: 0.2224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4279, partial_loss/deprel_loss: 1.9875, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1436, loss: 1.1866, batch_reg_loss: 0.0680, reg_loss: 0.0672 ||:  99%|#########8| 94/95 [01:06<00:00,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8137, UAS: 0.9012, LAS: 0.8216, UEM: 0.4672, LEM: 0.2210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0853, partial_loss/deprel_loss: 1.1440, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2002, loss: 1.1868, batch_reg_loss: 0.0680, reg_loss: 0.0672 ||: 100%|##########| 95/95 [01:06<00:00,  1.42it/s]\n",
+      "2023-04-06 23:02:01,360 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8164, UAS: 0.9162, LAS: 0.8416, UEM: 0.4038, LEM: 0.1126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5261, partial_loss/deprel_loss: 52.2277, partial_loss/cycle_loss: 0.0000, batch_loss: 42.0874, loss: 27.9840, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:07,  1.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9343, LAS: 0.8675, UEM: 0.6663, LEM: 0.3834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2763, partial_loss/deprel_loss: 18.2171, partial_loss/cycle_loss: 0.0000, batch_loss: 14.6289, loss: 23.2585, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:05,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8349, UAS: 0.9326, LAS: 0.8625, UEM: 0.5833, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9777, partial_loss/deprel_loss: 40.0335, partial_loss/cycle_loss: 0.0000, batch_loss: 32.2224, loss: 23.8342, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:07<00:02,  1.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9337, LAS: 0.8647, UEM: 0.6010, LEM: 0.3205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2426, partial_loss/deprel_loss: 20.5975, partial_loss/cycle_loss: 0.0000, batch_loss: 16.5265, loss: 24.2762, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:09<00:00,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9363, LAS: 0.8680, UEM: 0.6106, LEM: 0.3210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3556, partial_loss/deprel_loss: 25.5258, partial_loss/cycle_loss: 0.0000, batch_loss: 20.4918, loss: 23.9322, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.06it/s]\n",
+      "2023-04-06 23:02:11,763 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.067  |     0.000\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - UEM                      |     0.467  |     0.611\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - LEM                      |     0.221  |     0.321\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - EM                       |     0.814  |     0.901\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.085  |     0.356\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - UAS                      |     0.901  |     0.936\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.144  |    25.526\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - loss                     |     1.187  |    23.932\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - LAS                      |     0.822  |     0.868\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.907  |       N/A\n",
+      "2023-04-06 23:02:11,764 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:02:11,765 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:02:11,765 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:02:11,765 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:02:11,765 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:02:11,765 - INFO - combo.training.trainer - Epoch duration: 0:01:17.160911\n",
+      "2023-04-06 23:02:11,765 - INFO - combo.training.trainer - Estimated training time remaining: 7:25:19\n",
+      "2023-04-06 23:02:11,766 - INFO - allennlp.training.trainer - Epoch 11/399\n",
+      "2023-04-06 23:02:11,766 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:02:11,766 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:02:11,773 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9371, LAS: 0.8700, UEM: 0.7673, LEM: 0.5902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0930, partial_loss/deprel_loss: 0.2676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3007, loss: 0.7984, batch_reg_loss: 0.0680, reg_loss: 0.0680 ||:   3%|3         | 3/95 [00:02<01:15,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8207, UAS: 0.9161, LAS: 0.8430, UEM: 0.6421, LEM: 0.4579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1003, partial_loss/deprel_loss: 1.2503, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2884, loss: 1.0284, batch_reg_loss: 0.0681, reg_loss: 0.0680 ||:   6%|6         | 6/95 [00:04<01:10,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9152, LAS: 0.8389, UEM: 0.5687, LEM: 0.3555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3384, partial_loss/deprel_loss: 0.6925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6898, loss: 1.0641, batch_reg_loss: 0.0681, reg_loss: 0.0681 ||:  11%|#         | 10/95 [00:07<01:03,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7988, UAS: 0.9111, LAS: 0.8337, UEM: 0.5121, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3444, partial_loss/deprel_loss: 1.3470, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4147, loss: 1.1073, batch_reg_loss: 0.0682, reg_loss: 0.0681 ||:  15%|#4        | 14/95 [00:09<00:56,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8031, UAS: 0.9140, LAS: 0.8370, UEM: 0.5409, LEM: 0.3035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2805, partial_loss/deprel_loss: 1.3674, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4183, loss: 1.0751, batch_reg_loss: 0.0683, reg_loss: 0.0681 ||:  18%|#7        | 17/95 [00:12<00:57,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8467, UAS: 0.9148, LAS: 0.8375, UEM: 0.5036, LEM: 0.2682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6595, partial_loss/deprel_loss: 0.9234, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9390, loss: 1.0632, batch_reg_loss: 0.0683, reg_loss: 0.0682 ||:  22%|##2       | 21/95 [00:14<00:52,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7154, UAS: 0.9141, LAS: 0.8375, UEM: 0.5521, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7330, partial_loss/deprel_loss: 2.0155, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2274, loss: 1.0689, batch_reg_loss: 0.0684, reg_loss: 0.0682 ||:  25%|##5       | 24/95 [00:16<00:50,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8529, UAS: 0.9145, LAS: 0.8378, UEM: 0.5380, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6724, partial_loss/deprel_loss: 0.9636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9739, loss: 1.0667, batch_reg_loss: 0.0685, reg_loss: 0.0682 ||:  29%|##9       | 28/95 [00:19<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9145, LAS: 0.8375, UEM: 0.5314, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3632, partial_loss/deprel_loss: 0.6049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6251, loss: 1.0675, batch_reg_loss: 0.0685, reg_loss: 0.0683 ||:  33%|###2      | 31/95 [00:21<00:46,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9122, LAS: 0.8351, UEM: 0.5227, LEM: 0.2817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4412, partial_loss/deprel_loss: 0.7872, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 1.0905, batch_reg_loss: 0.0686, reg_loss: 0.0683 ||:  36%|###5      | 34/95 [00:23<00:44,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8412, UAS: 0.9136, LAS: 0.8364, UEM: 0.5206, LEM: 0.2695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6975, partial_loss/deprel_loss: 0.9374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9580, loss: 1.0752, batch_reg_loss: 0.0686, reg_loss: 0.0683 ||:  39%|###8      | 37/95 [00:26<00:44,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8514, UAS: 0.9136, LAS: 0.8363, UEM: 0.5173, LEM: 0.2624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6055, partial_loss/deprel_loss: 0.9506, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9503, loss: 1.0753, batch_reg_loss: 0.0687, reg_loss: 0.0683 ||:  42%|####2     | 40/95 [00:28<00:40,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7790, UAS: 0.9144, LAS: 0.8375, UEM: 0.5324, LEM: 0.2747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4415, partial_loss/deprel_loss: 1.4272, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4988, loss: 1.0630, batch_reg_loss: 0.0688, reg_loss: 0.0684 ||:  45%|####5     | 43/95 [00:30<00:39,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8695, UAS: 0.9137, LAS: 0.8369, UEM: 0.5255, LEM: 0.2673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5880, partial_loss/deprel_loss: 0.8005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8268, loss: 1.0684, batch_reg_loss: 0.0688, reg_loss: 0.0684 ||:  48%|####8     | 46/95 [00:33<00:36,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9121, LAS: 0.8351, UEM: 0.5167, LEM: 0.2606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3658, partial_loss/deprel_loss: 0.6982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7006, loss: 1.0860, batch_reg_loss: 0.0689, reg_loss: 0.0684 ||:  53%|#####2    | 50/95 [00:35<00:30,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7580, UAS: 0.9100, LAS: 0.8325, UEM: 0.5021, LEM: 0.2508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9662, partial_loss/deprel_loss: 1.8036, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9051, loss: 1.1094, batch_reg_loss: 0.0690, reg_loss: 0.0685 ||:  57%|#####6    | 54/95 [00:37<00:26,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8507, UAS: 0.9099, LAS: 0.8327, UEM: 0.5038, LEM: 0.2501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6799, partial_loss/deprel_loss: 0.9219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9425, loss: 1.1041, batch_reg_loss: 0.0690, reg_loss: 0.0685 ||:  61%|######1   | 58/95 [00:40<00:23,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9098, LAS: 0.8327, UEM: 0.5115, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2085, partial_loss/deprel_loss: 0.4961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5077, loss: 1.1045, batch_reg_loss: 0.0691, reg_loss: 0.0685 ||:  65%|######5   | 62/95 [00:43<00:23,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7990, UAS: 0.9075, LAS: 0.8304, UEM: 0.5118, LEM: 0.2565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3136, partial_loss/deprel_loss: 1.3261, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3928, loss: 1.1248, batch_reg_loss: 0.0692, reg_loss: 0.0686 ||:  68%|######8   | 65/95 [00:45<00:21,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9087, LAS: 0.8316, UEM: 0.5187, LEM: 0.2605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3529, partial_loss/deprel_loss: 0.5969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6173, loss: 1.1125, batch_reg_loss: 0.0692, reg_loss: 0.0686 ||:  72%|#######1  | 68/95 [00:47<00:19,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9087, LAS: 0.8316, UEM: 0.5122, LEM: 0.2553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3889, partial_loss/deprel_loss: 0.6496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6668, loss: 1.1118, batch_reg_loss: 0.0693, reg_loss: 0.0686 ||:  76%|#######5  | 72/95 [00:50<00:15,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9078, LAS: 0.8307, UEM: 0.4999, LEM: 0.2475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0150, partial_loss/deprel_loss: 1.2229, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2507, loss: 1.1199, batch_reg_loss: 0.0694, reg_loss: 0.0687 ||:  80%|########  | 76/95 [00:52<00:12,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7706, UAS: 0.9065, LAS: 0.8292, UEM: 0.4924, LEM: 0.2422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8164, partial_loss/deprel_loss: 1.5329, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6591, loss: 1.1326, batch_reg_loss: 0.0695, reg_loss: 0.0687 ||:  84%|########4 | 80/95 [00:54<00:09,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8633, UAS: 0.9077, LAS: 0.8305, UEM: 0.5010, LEM: 0.2464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3924, partial_loss/deprel_loss: 0.7104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7163, loss: 1.1202, batch_reg_loss: 0.0695, reg_loss: 0.0687 ||:  88%|########8 | 84/95 [00:57<00:07,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8075, UAS: 0.9064, LAS: 0.8288, UEM: 0.4941, LEM: 0.2412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0405, partial_loss/deprel_loss: 1.2673, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2915, loss: 1.1359, batch_reg_loss: 0.0696, reg_loss: 0.0688 ||:  93%|#########2| 88/95 [01:00<00:04,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8281, UAS: 0.9071, LAS: 0.8296, UEM: 0.4892, LEM: 0.2361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8237, partial_loss/deprel_loss: 1.0912, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1074, loss: 1.1295, batch_reg_loss: 0.0697, reg_loss: 0.0688 ||:  97%|#########6| 92/95 [01:02<00:01,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7914, UAS: 0.9071, LAS: 0.8296, UEM: 0.4845, LEM: 0.2324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3436, partial_loss/deprel_loss: 1.3869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4480, loss: 1.1300, batch_reg_loss: 0.0697, reg_loss: 0.0688 ||: 100%|##########| 95/95 [01:04<00:00,  1.47it/s]\n",
+      "2023-04-06 23:03:16,350 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:03:16,350 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:03:16,350 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.069  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - UEM                      |     0.484  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - LEM                      |     0.232  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - EM                       |     0.791  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.344  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - UAS                      |     0.907  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.387  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - loss                     |     1.130  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - LAS                      |     0.830  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.907  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:03:16,351 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:03:16,352 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:03:16,352 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:03:16,352 - INFO - combo.training.trainer - Epoch duration: 0:01:04.586566\n",
+      "2023-04-06 23:03:16,352 - INFO - combo.training.trainer - Estimated training time remaining: 7:21:58\n",
+      "2023-04-06 23:03:16,352 - INFO - allennlp.training.trainer - Epoch 12/399\n",
+      "2023-04-06 23:03:16,352 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:03:16,353 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:03:16,359 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8227, UAS: 0.9142, LAS: 0.8380, UEM: 0.5825, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8646, partial_loss/deprel_loss: 1.2057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2073, loss: 1.0739, batch_reg_loss: 0.0698, reg_loss: 0.0698 ||:   3%|3         | 3/95 [00:02<01:06,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9034, LAS: 0.8276, UEM: 0.6364, LEM: 0.4222, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1870, partial_loss/deprel_loss: 0.4088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4342, loss: 1.1700, batch_reg_loss: 0.0698, reg_loss: 0.0698 ||:   6%|6         | 6/95 [00:04<01:04,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7832, UAS: 0.9081, LAS: 0.8352, UEM: 0.7177, LEM: 0.5336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5395, partial_loss/deprel_loss: 1.5154, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5901, loss: 1.1147, batch_reg_loss: 0.0699, reg_loss: 0.0698 ||:   8%|8         | 8/95 [00:08<01:36,  1.10s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9166, LAS: 0.8453, UEM: 0.6879, LEM: 0.4704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3849, partial_loss/deprel_loss: 0.6113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6359, loss: 1.0103, batch_reg_loss: 0.0699, reg_loss: 0.0698 ||:  12%|#1        | 11/95 [00:10<01:24,  1.01s/it]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9076, LAS: 0.8340, UEM: 0.6387, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7420, partial_loss/deprel_loss: 1.0690, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0736, loss: 1.1095, batch_reg_loss: 0.0700, reg_loss: 0.0699 ||:  15%|#4        | 14/95 [00:13<01:15,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8029, UAS: 0.9005, LAS: 0.8259, UEM: 0.5868, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3702, partial_loss/deprel_loss: 1.3301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4082, loss: 1.1735, batch_reg_loss: 0.0701, reg_loss: 0.0699 ||:  19%|#8        | 18/95 [00:15<01:04,  1.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9052, LAS: 0.8306, UEM: 0.5698, LEM: 0.3542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4813, partial_loss/deprel_loss: 0.7393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7578, loss: 1.1321, batch_reg_loss: 0.0701, reg_loss: 0.0699 ||:  22%|##2       | 21/95 [00:17<01:00,  1.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8127, UAS: 0.9013, LAS: 0.8258, UEM: 0.5385, LEM: 0.3329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1662, partial_loss/deprel_loss: 1.3604, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3917, loss: 1.1798, batch_reg_loss: 0.0702, reg_loss: 0.0700 ||:  25%|##5       | 24/95 [00:19<00:54,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.9033, LAS: 0.8286, UEM: 0.5236, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6162, partial_loss/deprel_loss: 0.7490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7927, loss: 1.1548, batch_reg_loss: 0.0702, reg_loss: 0.0700 ||:  28%|##8       | 27/95 [00:21<00:51,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8474, UAS: 0.9078, LAS: 0.8336, UEM: 0.5471, LEM: 0.3188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6983, partial_loss/deprel_loss: 1.0023, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0118, loss: 1.1121, batch_reg_loss: 0.0703, reg_loss: 0.0700 ||:  32%|###1      | 30/95 [00:24<00:48,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7711, UAS: 0.9058, LAS: 0.8310, UEM: 0.5267, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7300, partial_loss/deprel_loss: 1.5565, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6616, loss: 1.1349, batch_reg_loss: 0.0704, reg_loss: 0.0700 ||:  35%|###4      | 33/95 [00:26<00:45,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8769, UAS: 0.9046, LAS: 0.8294, UEM: 0.5203, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4184, partial_loss/deprel_loss: 0.6940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7093, loss: 1.1464, batch_reg_loss: 0.0704, reg_loss: 0.0701 ||:  38%|###7      | 36/95 [00:28<00:45,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.9070, LAS: 0.8316, UEM: 0.5123, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8512, partial_loss/deprel_loss: 1.1832, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1873, loss: 1.1284, batch_reg_loss: 0.0705, reg_loss: 0.0701 ||:  42%|####2     | 40/95 [00:31<00:38,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9052, LAS: 0.8290, UEM: 0.4983, LEM: 0.2697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4265, partial_loss/deprel_loss: 0.8326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8220, loss: 1.1563, batch_reg_loss: 0.0706, reg_loss: 0.0702 ||:  46%|####6     | 44/95 [00:33<00:35,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8177, UAS: 0.9056, LAS: 0.8295, UEM: 0.4901, LEM: 0.2619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9502, partial_loss/deprel_loss: 1.1176, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1547, loss: 1.1493, batch_reg_loss: 0.0707, reg_loss: 0.0702 ||:  49%|####9     | 47/95 [00:35<00:32,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8601, UAS: 0.9061, LAS: 0.8299, UEM: 0.4935, LEM: 0.2593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5518, partial_loss/deprel_loss: 0.8065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8263, loss: 1.1427, batch_reg_loss: 0.0707, reg_loss: 0.0702 ||:  53%|#####2    | 50/95 [00:38<00:32,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9074, LAS: 0.8313, UEM: 0.4914, LEM: 0.2539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5048, partial_loss/deprel_loss: 0.7113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7408, loss: 1.1276, batch_reg_loss: 0.0708, reg_loss: 0.0703 ||:  56%|#####5    | 53/95 [00:40<00:29,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9088, LAS: 0.8330, UEM: 0.4917, LEM: 0.2485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5163, partial_loss/deprel_loss: 0.7191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7494, loss: 1.1115, batch_reg_loss: 0.0709, reg_loss: 0.0703 ||:  59%|#####8    | 56/95 [00:42<00:27,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7491, UAS: 0.9080, LAS: 0.8324, UEM: 0.4943, LEM: 0.2500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1553, partial_loss/deprel_loss: 1.5914, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7751, loss: 1.1141, batch_reg_loss: 0.0709, reg_loss: 0.0703 ||:  62%|######2   | 59/95 [00:44<00:25,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8495, UAS: 0.9075, LAS: 0.8318, UEM: 0.4819, LEM: 0.2405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6134, partial_loss/deprel_loss: 0.8982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9122, loss: 1.1176, batch_reg_loss: 0.0710, reg_loss: 0.0704 ||:  66%|######6   | 63/95 [00:46<00:21,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8162, UAS: 0.9076, LAS: 0.8317, UEM: 0.4790, LEM: 0.2382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0133, partial_loss/deprel_loss: 1.2214, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2509, loss: 1.1179, batch_reg_loss: 0.0710, reg_loss: 0.0704 ||:  69%|######9   | 66/95 [00:49<00:20,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8660, UAS: 0.9067, LAS: 0.8308, UEM: 0.4723, LEM: 0.2336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5435, partial_loss/deprel_loss: 0.8242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8391, loss: 1.1274, batch_reg_loss: 0.0711, reg_loss: 0.0704 ||:  73%|#######2  | 69/95 [00:51<00:18,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8457, UAS: 0.9068, LAS: 0.8308, UEM: 0.4759, LEM: 0.2362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7431, partial_loss/deprel_loss: 0.9755, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0002, loss: 1.1290, batch_reg_loss: 0.0712, reg_loss: 0.0705 ||:  77%|#######6  | 73/95 [00:54<00:15,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8191, UAS: 0.9068, LAS: 0.8307, UEM: 0.4711, LEM: 0.2321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0499, partial_loss/deprel_loss: 1.2025, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2433, loss: 1.1291, batch_reg_loss: 0.0712, reg_loss: 0.0705 ||:  80%|########  | 76/95 [00:56<00:13,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9062, LAS: 0.8303, UEM: 0.4706, LEM: 0.2287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4272, partial_loss/deprel_loss: 0.7090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7240, loss: 1.1358, batch_reg_loss: 0.0713, reg_loss: 0.0705 ||:  84%|########4 | 80/95 [00:58<00:10,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8396, UAS: 0.9063, LAS: 0.8304, UEM: 0.4649, LEM: 0.2238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7495, partial_loss/deprel_loss: 1.0563, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0663, loss: 1.1354, batch_reg_loss: 0.0714, reg_loss: 0.0706 ||:  88%|########8 | 84/95 [01:01<00:07,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9080, LAS: 0.8324, UEM: 0.4830, LEM: 0.2363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3591, partial_loss/deprel_loss: 0.6660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6761, loss: 1.1192, batch_reg_loss: 0.0715, reg_loss: 0.0706 ||:  93%|#########2| 88/95 [01:03<00:04,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9089, LAS: 0.8334, UEM: 0.4855, LEM: 0.2353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3223, partial_loss/deprel_loss: 0.6439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6511, loss: 1.1072, batch_reg_loss: 0.0716, reg_loss: 0.0706 ||:  97%|#########6| 92/95 [01:06<00:01,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9097, LAS: 0.8345, UEM: 0.4884, LEM: 0.2346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6029, partial_loss/deprel_loss: 0.8348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8601, loss: 1.0974, batch_reg_loss: 0.0716, reg_loss: 0.0707 ||: 100%|##########| 95/95 [01:08<00:00,  1.40it/s]\n",
+      "2023-04-06 23:04:24,427 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:04:24,427 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:04:24,427 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.071  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - UEM                      |     0.488  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - LEM                      |     0.235  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - EM                       |     0.863  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.603  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - UAS                      |     0.910  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.835  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - loss                     |     1.097  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - LAS                      |     0.835  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.907  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:04:24,428 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:04:24,429 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:04:24,429 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:04:24,429 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:04:24,429 - INFO - combo.training.trainer - Epoch duration: 0:01:08.076904\n",
+      "2023-04-06 23:04:24,429 - INFO - combo.training.trainer - Estimated training time remaining: 7:20:41\n",
+      "2023-04-06 23:04:24,430 - INFO - allennlp.training.trainer - Epoch 13/399\n",
+      "2023-04-06 23:04:24,430 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:04:24,430 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:04:24,436 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8559, UAS: 0.9381, LAS: 0.8680, UEM: 0.6473, LEM: 0.3485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6424, partial_loss/deprel_loss: 0.8496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8799, loss: 0.7820, batch_reg_loss: 0.0717, reg_loss: 0.0717 ||:   4%|4         | 4/95 [00:02<00:55,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7985, UAS: 0.9090, LAS: 0.8358, UEM: 0.5967, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3901, partial_loss/deprel_loss: 1.4267, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4911, loss: 1.0766, batch_reg_loss: 0.0718, reg_loss: 0.0717 ||:   7%|7         | 7/95 [00:04<00:56,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9142, LAS: 0.8405, UEM: 0.5602, LEM: 0.2753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3589, partial_loss/deprel_loss: 0.5954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6199, loss: 1.0375, batch_reg_loss: 0.0718, reg_loss: 0.0717 ||:  12%|#1        | 11/95 [00:07<00:53,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.9187, LAS: 0.8454, UEM: 0.5227, LEM: 0.2421, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8380, partial_loss/deprel_loss: 1.0987, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1185, loss: 1.0070, batch_reg_loss: 0.0719, reg_loss: 0.0718 ||:  16%|#5        | 15/95 [00:09<00:49,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9218, LAS: 0.8490, UEM: 0.5440, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2444, partial_loss/deprel_loss: 0.5095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5285, loss: 0.9723, batch_reg_loss: 0.0720, reg_loss: 0.0718 ||:  20%|##        | 19/95 [00:11<00:47,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9254, LAS: 0.8535, UEM: 0.5707, LEM: 0.2752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4998, partial_loss/deprel_loss: 0.7194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7475, loss: 0.9289, batch_reg_loss: 0.0720, reg_loss: 0.0718 ||:  23%|##3       | 22/95 [00:14<00:47,  1.53it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8447, UAS: 0.9244, LAS: 0.8525, UEM: 0.5700, LEM: 0.2769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7205, partial_loss/deprel_loss: 0.9875, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0062, loss: 0.9452, batch_reg_loss: 0.0721, reg_loss: 0.0719 ||:  26%|##6       | 25/95 [00:16<00:47,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8832, UAS: 0.9257, LAS: 0.8542, UEM: 0.5648, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3978, partial_loss/deprel_loss: 0.6602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6798, loss: 0.9305, batch_reg_loss: 0.0721, reg_loss: 0.0719 ||:  29%|##9       | 28/95 [00:18<00:45,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8617, UAS: 0.9247, LAS: 0.8526, UEM: 0.5489, LEM: 0.2609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6482, partial_loss/deprel_loss: 0.8613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8909, loss: 0.9451, batch_reg_loss: 0.0722, reg_loss: 0.0719 ||:  34%|###3      | 32/95 [00:20<00:42,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9219, LAS: 0.8491, UEM: 0.5345, LEM: 0.2525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5332, partial_loss/deprel_loss: 0.8294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8425, loss: 0.9753, batch_reg_loss: 0.0723, reg_loss: 0.0720 ||:  37%|###6      | 35/95 [00:23<00:41,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8058, UAS: 0.9230, LAS: 0.8511, UEM: 0.5672, LEM: 0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1614, partial_loss/deprel_loss: 1.1866, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2539, loss: 0.9600, batch_reg_loss: 0.0723, reg_loss: 0.0720 ||:  40%|####      | 38/95 [00:25<00:41,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7790, UAS: 0.9219, LAS: 0.8504, UEM: 0.5568, LEM: 0.2914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5085, partial_loss/deprel_loss: 1.4547, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5378, loss: 0.9640, batch_reg_loss: 0.0724, reg_loss: 0.0720 ||:  44%|####4     | 42/95 [00:28<00:36,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9209, LAS: 0.8496, UEM: 0.5509, LEM: 0.2868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4107, partial_loss/deprel_loss: 0.6130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6450, loss: 0.9750, batch_reg_loss: 0.0725, reg_loss: 0.0721 ||:  47%|####7     | 45/95 [00:30<00:34,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9199, LAS: 0.8483, UEM: 0.5340, LEM: 0.2747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6735, partial_loss/deprel_loss: 0.9725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9852, loss: 0.9868, batch_reg_loss: 0.0725, reg_loss: 0.0721 ||:  52%|#####1    | 49/95 [00:32<00:31,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9180, LAS: 0.8463, UEM: 0.5306, LEM: 0.2716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3827, partial_loss/deprel_loss: 0.6815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6944, loss: 1.0060, batch_reg_loss: 0.0726, reg_loss: 0.0721 ||:  55%|#####4    | 52/95 [00:35<00:30,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8418, UAS: 0.9184, LAS: 0.8466, UEM: 0.5256, LEM: 0.2655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7632, partial_loss/deprel_loss: 0.9772, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0071, loss: 1.0007, batch_reg_loss: 0.0727, reg_loss: 0.0722 ||:  59%|#####8    | 56/95 [00:37<00:26,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7729, UAS: 0.9164, LAS: 0.8441, UEM: 0.5115, LEM: 0.2566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5636, partial_loss/deprel_loss: 1.4738, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5645, loss: 1.0198, batch_reg_loss: 0.0728, reg_loss: 0.0722 ||:  63%|######3   | 60/95 [00:39<00:22,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7463, UAS: 0.9147, LAS: 0.8422, UEM: 0.5032, LEM: 0.2503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0702, partial_loss/deprel_loss: 1.6810, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8317, loss: 1.0350, batch_reg_loss: 0.0729, reg_loss: 0.0722 ||:  67%|######7   | 64/95 [00:42<00:19,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8639, UAS: 0.9151, LAS: 0.8426, UEM: 0.5026, LEM: 0.2482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6344, partial_loss/deprel_loss: 0.8218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8573, loss: 1.0305, batch_reg_loss: 0.0730, reg_loss: 0.0723 ||:  72%|#######1  | 68/95 [00:45<00:18,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7964, UAS: 0.9153, LAS: 0.8428, UEM: 0.5113, LEM: 0.2611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4143, partial_loss/deprel_loss: 1.4025, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4779, loss: 1.0303, batch_reg_loss: 0.0730, reg_loss: 0.0723 ||:  75%|#######4  | 71/95 [00:48<00:18,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7762, UAS: 0.9132, LAS: 0.8403, UEM: 0.5022, LEM: 0.2556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6510, partial_loss/deprel_loss: 1.4862, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5923, loss: 1.0526, batch_reg_loss: 0.0731, reg_loss: 0.0723 ||:  79%|#######8  | 75/95 [00:50<00:14,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9131, LAS: 0.8403, UEM: 0.4988, LEM: 0.2511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8652, partial_loss/deprel_loss: 0.9862, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0352, loss: 1.0537, batch_reg_loss: 0.0732, reg_loss: 0.0724 ||:  83%|########3 | 79/95 [00:53<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9131, LAS: 0.8402, UEM: 0.4962, LEM: 0.2491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4240, partial_loss/deprel_loss: 0.7195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7337, loss: 1.0538, batch_reg_loss: 0.0733, reg_loss: 0.0724 ||:  86%|########6 | 82/95 [00:55<00:09,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8696, UAS: 0.9123, LAS: 0.8394, UEM: 0.4930, LEM: 0.2456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4785, partial_loss/deprel_loss: 0.7711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7859, loss: 1.0607, batch_reg_loss: 0.0733, reg_loss: 0.0725 ||:  89%|########9 | 85/95 [00:57<00:07,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8604, UAS: 0.9126, LAS: 0.8397, UEM: 0.5022, LEM: 0.2528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4379, partial_loss/deprel_loss: 0.8143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8124, loss: 1.0589, batch_reg_loss: 0.0734, reg_loss: 0.0725 ||:  93%|#########2| 88/95 [00:59<00:05,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8832, UAS: 0.9123, LAS: 0.8392, UEM: 0.4962, LEM: 0.2488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3830, partial_loss/deprel_loss: 0.6632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6806, loss: 1.0621, batch_reg_loss: 0.0735, reg_loss: 0.0725 ||:  97%|#########6| 92/95 [01:02<00:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8763, UAS: 0.9117, LAS: 0.8385, UEM: 0.4926, LEM: 0.2454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5572, partial_loss/deprel_loss: 0.7749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8049, loss: 1.0700, batch_reg_loss: 0.0735, reg_loss: 0.0726 ||: 100%|##########| 95/95 [01:04<00:00,  1.48it/s]\n",
+      "2023-04-06 23:05:28,662 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:05:28,662 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:05:28,662 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.073  |       N/A\n",
+      "2023-04-06 23:05:28,662 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:05:28,662 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - UEM                      |     0.493  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - LEM                      |     0.245  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - EM                       |     0.876  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.557  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - UAS                      |     0.912  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.775  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - loss                     |     1.070  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - LAS                      |     0.838  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.907  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:05:28,663 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:05:28,664 - INFO - combo.training.trainer - Epoch duration: 0:01:04.234400\n",
+      "2023-04-06 23:05:28,664 - INFO - combo.training.trainer - Estimated training time remaining: 7:17:40\n",
+      "2023-04-06 23:05:28,664 - INFO - allennlp.training.trainer - Epoch 14/399\n",
+      "2023-04-06 23:05:28,664 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:05:28,665 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:05:28,670 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.8995, LAS: 0.8276, UEM: 0.4028, LEM: 0.1517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5184, partial_loss/deprel_loss: 0.7889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8084, loss: 1.1586, batch_reg_loss: 0.0736, reg_loss: 0.0736 ||:   3%|3         | 3/95 [00:02<01:07,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8122, UAS: 0.9089, LAS: 0.8349, UEM: 0.4075, LEM: 0.1567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2148, partial_loss/deprel_loss: 1.2551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3207, loss: 1.0912, batch_reg_loss: 0.0737, reg_loss: 0.0736 ||:   6%|6         | 6/95 [00:04<01:04,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8321, UAS: 0.9115, LAS: 0.8384, UEM: 0.3569, LEM: 0.1226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0056, partial_loss/deprel_loss: 1.0178, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0892, loss: 1.0504, batch_reg_loss: 0.0738, reg_loss: 0.0737 ||:  11%|#         | 10/95 [00:06<00:58,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9078, LAS: 0.8351, UEM: 0.4315, LEM: 0.1907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5430, loss: 1.0827, batch_reg_loss: 0.0738, reg_loss: 0.0737 ||:  14%|#3        | 13/95 [00:08<00:56,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8708, UAS: 0.9063, LAS: 0.8329, UEM: 0.4217, LEM: 0.1819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4802, partial_loss/deprel_loss: 0.7585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7768, loss: 1.1004, batch_reg_loss: 0.0739, reg_loss: 0.0737 ||:  18%|#7        | 17/95 [00:11<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7983, UAS: 0.9064, LAS: 0.8333, UEM: 0.4143, LEM: 0.1745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4510, partial_loss/deprel_loss: 1.4362, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5131, loss: 1.1014, batch_reg_loss: 0.0740, reg_loss: 0.0738 ||:  21%|##1       | 20/95 [00:13<00:51,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8349, UAS: 0.9072, LAS: 0.8341, UEM: 0.4074, LEM: 0.1658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9802, partial_loss/deprel_loss: 1.0603, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1183, loss: 1.0997, batch_reg_loss: 0.0741, reg_loss: 0.0738 ||:  25%|##5       | 24/95 [00:15<00:46,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7769, UAS: 0.9086, LAS: 0.8357, UEM: 0.4271, LEM: 0.1792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6805, partial_loss/deprel_loss: 1.4625, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5803, loss: 1.0884, batch_reg_loss: 0.0742, reg_loss: 0.0739 ||:  29%|##9       | 28/95 [00:18<00:42,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8238, UAS: 0.9128, LAS: 0.8405, UEM: 0.4980, LEM: 0.2405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2294, partial_loss/deprel_loss: 1.1924, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2740, loss: 1.0447, batch_reg_loss: 0.0742, reg_loss: 0.0739 ||:  34%|###3      | 32/95 [00:21<00:44,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9143, LAS: 0.8424, UEM: 0.4999, LEM: 0.2391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4578, partial_loss/deprel_loss: 0.7604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7742, loss: 1.0288, batch_reg_loss: 0.0743, reg_loss: 0.0739 ||:  37%|###6      | 35/95 [00:23<00:41,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9161, LAS: 0.8445, UEM: 0.5030, LEM: 0.2381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3425, partial_loss/deprel_loss: 0.6150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6349, loss: 1.0128, batch_reg_loss: 0.0744, reg_loss: 0.0740 ||:  40%|####      | 38/95 [00:25<00:39,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9150, LAS: 0.8434, UEM: 0.4975, LEM: 0.2359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4017, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6030, loss: 1.0182, batch_reg_loss: 0.0744, reg_loss: 0.0740 ||:  44%|####4     | 42/95 [00:28<00:37,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7646, UAS: 0.9144, LAS: 0.8432, UEM: 0.5281, LEM: 0.2809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9945, partial_loss/deprel_loss: 1.5558, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7180, loss: 1.0241, batch_reg_loss: 0.0745, reg_loss: 0.0740 ||:  47%|####7     | 45/95 [00:31<00:36,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9145, LAS: 0.8433, UEM: 0.5175, LEM: 0.2697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.7959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7951, loss: 1.0231, batch_reg_loss: 0.0746, reg_loss: 0.0741 ||:  52%|#####1    | 49/95 [00:33<00:31,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8603, UAS: 0.9136, LAS: 0.8421, UEM: 0.5076, LEM: 0.2621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7028, partial_loss/deprel_loss: 0.8929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9295, loss: 1.0349, batch_reg_loss: 0.0746, reg_loss: 0.0741 ||:  55%|#####4    | 52/95 [00:35<00:29,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9155, LAS: 0.8441, UEM: 0.5193, LEM: 0.2683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3191, partial_loss/deprel_loss: 0.6088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6256, loss: 1.0190, batch_reg_loss: 0.0747, reg_loss: 0.0741 ||:  58%|#####7    | 55/95 [00:37<00:28,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8247, UAS: 0.9151, LAS: 0.8434, UEM: 0.5131, LEM: 0.2629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8426, partial_loss/deprel_loss: 1.2188, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2183, loss: 1.0272, batch_reg_loss: 0.0748, reg_loss: 0.0742 ||:  62%|######2   | 59/95 [00:40<00:24,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8308, UAS: 0.9160, LAS: 0.8443, UEM: 0.5126, LEM: 0.2595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7857, partial_loss/deprel_loss: 1.0030, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0343, loss: 1.0196, batch_reg_loss: 0.0748, reg_loss: 0.0742 ||:  65%|######5   | 62/95 [00:42<00:22,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9158, LAS: 0.8441, UEM: 0.5048, LEM: 0.2534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8111, partial_loss/deprel_loss: 0.9532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9997, loss: 1.0238, batch_reg_loss: 0.0749, reg_loss: 0.0743 ||:  69%|######9   | 66/95 [00:44<00:19,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8682, UAS: 0.9161, LAS: 0.8444, UEM: 0.5025, LEM: 0.2511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6108, partial_loss/deprel_loss: 0.7552, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8013, loss: 1.0215, batch_reg_loss: 0.0750, reg_loss: 0.0743 ||:  74%|#######3  | 70/95 [00:47<00:16,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9148, LAS: 0.8428, UEM: 0.5010, LEM: 0.2483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3281, partial_loss/deprel_loss: 0.6570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 1.0366, batch_reg_loss: 0.0751, reg_loss: 0.0743 ||:  78%|#######7  | 74/95 [00:49<00:13,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9138, LAS: 0.8419, UEM: 0.4946, LEM: 0.2443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7095, partial_loss/deprel_loss: 0.9343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9645, loss: 1.0429, batch_reg_loss: 0.0752, reg_loss: 0.0744 ||:  82%|########2 | 78/95 [00:52<00:11,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7902, UAS: 0.9139, LAS: 0.8420, UEM: 0.4931, LEM: 0.2423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8576, partial_loss/deprel_loss: 1.5264, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6679, loss: 1.0455, batch_reg_loss: 0.0753, reg_loss: 0.0744 ||:  86%|########6 | 82/95 [00:55<00:08,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8269, UAS: 0.9141, LAS: 0.8424, UEM: 0.5003, LEM: 0.2525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0369, partial_loss/deprel_loss: 1.2106, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2512, loss: 1.0436, batch_reg_loss: 0.0754, reg_loss: 0.0745 ||:  91%|######### | 86/95 [00:58<00:06,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9140, LAS: 0.8425, UEM: 0.5041, LEM: 0.2537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3531, partial_loss/deprel_loss: 0.5890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6173, loss: 1.0458, batch_reg_loss: 0.0754, reg_loss: 0.0745 ||:  94%|#########3| 89/95 [01:00<00:04,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8309, UAS: 0.9140, LAS: 0.8425, UEM: 0.4988, LEM: 0.2487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9683, partial_loss/deprel_loss: 1.0885, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1400, loss: 1.0450, batch_reg_loss: 0.0755, reg_loss: 0.0745 ||:  98%|#########7| 93/95 [01:03<00:01,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9147, LAS: 0.8433, UEM: 0.5042, LEM: 0.2521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3336, partial_loss/deprel_loss: 0.5771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6039, loss: 1.0379, batch_reg_loss: 0.0756, reg_loss: 0.0746 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.075  |       N/A\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - UEM                      |     0.504  |       N/A\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - LEM                      |     0.252  |       N/A\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - EM                       |     0.887  |       N/A\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.334  |       N/A\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - UAS                      |     0.915  |       N/A\n",
+      "2023-04-06 23:06:33,739 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.577  |       N/A\n",
+      "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - loss                     |     1.038  |       N/A\n",
+      "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - LAS                      |     0.843  |       N/A\n",
+      "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.325  |       N/A\n",
+      "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:06:33,740 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:06:33,741 - INFO - combo.training.trainer - Epoch duration: 0:01:05.076501\n",
+      "2023-04-06 23:06:33,741 - INFO - combo.training.trainer - Estimated training time remaining: 7:15:16\n",
+      "2023-04-06 23:06:33,741 - INFO - allennlp.training.trainer - Epoch 15/399\n",
+      "2023-04-06 23:06:33,741 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:06:33,741 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:06:33,748 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9288, LAS: 0.8590, UEM: 0.4644, LEM: 0.2095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3342, partial_loss/deprel_loss: 0.5915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6157, loss: 0.9118, batch_reg_loss: 0.0756, reg_loss: 0.0756 ||:   3%|3         | 3/95 [00:02<01:03,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8783, UAS: 0.9227, LAS: 0.8551, UEM: 0.4754, LEM: 0.2201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4619, partial_loss/deprel_loss: 0.7155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7405, loss: 0.9390, batch_reg_loss: 0.0757, reg_loss: 0.0756 ||:   6%|6         | 6/95 [00:04<01:01,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9234, LAS: 0.8552, UEM: 0.5529, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4761, partial_loss/deprel_loss: 0.7624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7809, loss: 0.9247, batch_reg_loss: 0.0758, reg_loss: 0.0757 ||:   9%|9         | 9/95 [00:06<01:01,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.9260, LAS: 0.8572, UEM: 0.5653, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3541, partial_loss/deprel_loss: 0.6327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6528, loss: 0.9133, batch_reg_loss: 0.0758, reg_loss: 0.0757 ||:  13%|#2        | 12/95 [00:08<00:59,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9186, LAS: 0.8482, UEM: 0.5590, LEM: 0.2874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3758, partial_loss/deprel_loss: 0.6077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6373, loss: 0.9877, batch_reg_loss: 0.0759, reg_loss: 0.0757 ||:  17%|#6        | 16/95 [00:11<00:53,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9244, LAS: 0.8549, UEM: 0.5798, LEM: 0.2914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4062, partial_loss/deprel_loss: 0.7005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7176, loss: 0.9355, batch_reg_loss: 0.0760, reg_loss: 0.0758 ||:  21%|##1       | 20/95 [00:13<00:50,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8450, UAS: 0.9241, LAS: 0.8542, UEM: 0.5484, LEM: 0.2661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7622, partial_loss/deprel_loss: 0.9469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9861, loss: 0.9463, batch_reg_loss: 0.0761, reg_loss: 0.0758 ||:  25%|##5       | 24/95 [00:15<00:45,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9218, LAS: 0.8524, UEM: 0.5621, LEM: 0.2783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2784, partial_loss/deprel_loss: 0.4925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5259, loss: 0.9628, batch_reg_loss: 0.0762, reg_loss: 0.0759 ||:  29%|##9       | 28/95 [00:18<00:43,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7785, UAS: 0.9227, LAS: 0.8543, UEM: 0.6101, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9559, partial_loss/deprel_loss: 1.5021, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6691, loss: 0.9506, batch_reg_loss: 0.0762, reg_loss: 0.0759 ||:  33%|###2      | 31/95 [00:21<00:45,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9232, LAS: 0.8549, UEM: 0.6136, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1723, partial_loss/deprel_loss: 0.4036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4337, loss: 0.9453, batch_reg_loss: 0.0763, reg_loss: 0.0759 ||:  36%|###5      | 34/95 [00:23<00:42,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8518, UAS: 0.9206, LAS: 0.8518, UEM: 0.5920, LEM: 0.3305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6710, partial_loss/deprel_loss: 0.8887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9216, loss: 0.9707, batch_reg_loss: 0.0764, reg_loss: 0.0760 ||:  40%|####      | 38/95 [00:25<00:37,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8388, UAS: 0.9188, LAS: 0.8498, UEM: 0.5726, LEM: 0.3151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9090, partial_loss/deprel_loss: 1.0273, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0801, loss: 0.9862, batch_reg_loss: 0.0765, reg_loss: 0.0760 ||:  44%|####4     | 42/95 [00:28<00:35,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9197, LAS: 0.8510, UEM: 0.5769, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3747, partial_loss/deprel_loss: 0.6371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6612, loss: 0.9721, batch_reg_loss: 0.0765, reg_loss: 0.0761 ||:  47%|####7     | 45/95 [00:30<00:35,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7993, UAS: 0.9199, LAS: 0.8513, UEM: 0.5792, LEM: 0.3180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4818, partial_loss/deprel_loss: 1.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4545, loss: 0.9709, batch_reg_loss: 0.0766, reg_loss: 0.0761 ||:  51%|#####     | 48/95 [00:32<00:34,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7902, UAS: 0.9192, LAS: 0.8503, UEM: 0.5732, LEM: 0.3145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2909, partial_loss/deprel_loss: 1.3614, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4240, loss: 0.9733, batch_reg_loss: 0.0767, reg_loss: 0.0761 ||:  54%|#####3    | 51/95 [00:35<00:32,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8298, UAS: 0.9190, LAS: 0.8499, UEM: 0.5627, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9471, partial_loss/deprel_loss: 1.1233, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1648, loss: 0.9763, batch_reg_loss: 0.0768, reg_loss: 0.0762 ||:  57%|#####6    | 54/95 [00:37<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7755, UAS: 0.9179, LAS: 0.8488, UEM: 0.5505, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8752, partial_loss/deprel_loss: 1.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6692, loss: 0.9884, batch_reg_loss: 0.0768, reg_loss: 0.0762 ||:  61%|######1   | 58/95 [00:40<00:26,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9177, LAS: 0.8488, UEM: 0.5661, LEM: 0.3133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1684, partial_loss/deprel_loss: 0.3627, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4008, loss: 0.9884, batch_reg_loss: 0.0769, reg_loss: 0.0762 ||:  64%|######4   | 61/95 [00:42<00:25,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9166, LAS: 0.8477, UEM: 0.5528, LEM: 0.3043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5622, partial_loss/deprel_loss: 0.8644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8809, loss: 0.9998, batch_reg_loss: 0.0770, reg_loss: 0.0763 ||:  68%|######8   | 65/95 [00:44<00:20,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8357, UAS: 0.9160, LAS: 0.8466, UEM: 0.5391, LEM: 0.2946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9552, partial_loss/deprel_loss: 1.0026, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0702, loss: 1.0081, batch_reg_loss: 0.0771, reg_loss: 0.0763 ||:  73%|#######2  | 69/95 [00:46<00:16,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9163, LAS: 0.8468, UEM: 0.5345, LEM: 0.2866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7857, partial_loss/deprel_loss: 0.9780, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0168, loss: 1.0061, batch_reg_loss: 0.0772, reg_loss: 0.0764 ||:  77%|#######6  | 73/95 [00:49<00:13,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8416, UAS: 0.9161, LAS: 0.8465, UEM: 0.5242, LEM: 0.2776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8016, partial_loss/deprel_loss: 0.9685, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0124, loss: 1.0086, batch_reg_loss: 0.0773, reg_loss: 0.0764 ||:  81%|########1 | 77/95 [00:51<00:10,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8215, UAS: 0.9153, LAS: 0.8454, UEM: 0.5156, LEM: 0.2718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9789, partial_loss/deprel_loss: 1.2141, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2444, loss: 1.0181, batch_reg_loss: 0.0774, reg_loss: 0.0765 ||:  85%|########5 | 81/95 [00:54<00:08,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9155, LAS: 0.8456, UEM: 0.5128, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3639, partial_loss/deprel_loss: 0.6349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6581, loss: 1.0161, batch_reg_loss: 0.0775, reg_loss: 0.0765 ||:  89%|########9 | 85/95 [00:56<00:06,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8748, UAS: 0.9155, LAS: 0.8454, UEM: 0.5119, LEM: 0.2650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4624, partial_loss/deprel_loss: 0.7593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7775, loss: 1.0191, batch_reg_loss: 0.0775, reg_loss: 0.0766 ||:  94%|#########3| 89/95 [01:00<00:04,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9154, LAS: 0.8452, UEM: 0.5062, LEM: 0.2609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8630, partial_loss/deprel_loss: 1.0097, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0580, loss: 1.0202, batch_reg_loss: 0.0776, reg_loss: 0.0766 ||:  97%|#########6| 92/95 [01:02<00:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.9157, LAS: 0.8456, UEM: 0.5057, LEM: 0.2600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7605, partial_loss/deprel_loss: 1.0813, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0948, loss: 1.0184, batch_reg_loss: 0.0777, reg_loss: 0.0766 ||: 100%|##########| 95/95 [01:04<00:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.9157, LAS: 0.8456, UEM: 0.5057, LEM: 0.2600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7605, partial_loss/deprel_loss: 1.0813, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0948, loss: 1.0184, batch_reg_loss: 0.0777, reg_loss: 0.0766 ||: 100%|##########| 95/95 [01:04<00:00,  1.47it/s]\n",
+      "2023-04-06 23:07:38,192 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9231, LAS: 0.8549, UEM: 0.2597, LEM: 0.0747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8460, partial_loss/deprel_loss: 41.4560, partial_loss/cycle_loss: 0.0000, batch_loss: 33.3340, loss: 30.5996, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:07,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9399, LAS: 0.8781, UEM: 0.6512, LEM: 0.4118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2229, partial_loss/deprel_loss: 18.9218, partial_loss/cycle_loss: 0.0000, batch_loss: 15.1820, loss: 25.0834, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:05<00:05,  1.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9336, LAS: 0.8698, UEM: 0.5862, LEM: 0.3545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7833, partial_loss/deprel_loss: 31.7641, partial_loss/cycle_loss: 0.0000, batch_loss: 25.5679, loss: 27.7894, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:07<00:04,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9401, LAS: 0.8766, UEM: 0.6039, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5219, partial_loss/deprel_loss: 22.8067, partial_loss/cycle_loss: 0.0000, batch_loss: 18.3497, loss: 25.6024, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:09<00:00,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9428, LAS: 0.8808, UEM: 0.6373, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2147, partial_loss/deprel_loss: 21.5416, partial_loss/cycle_loss: 0.0000, batch_loss: 17.2762, loss: 24.8455, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.01it/s]\n",
+      "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.077  |     0.000\n",
+      "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - UEM                      |     0.506  |     0.637\n",
+      "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - LEM                      |     0.260  |     0.358\n",
+      "2023-04-06 23:07:49,043 - INFO - combo.training.tensorboard_writer - EM                       |     0.840  |     0.923\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.761  |     0.215\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - UAS                      |     0.916  |     0.943\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.081  |    21.542\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - loss                     |     1.018  |    24.845\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - LAS                      |     0.846  |     0.881\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.325  |       N/A\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:07:49,044 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:07:49,045 - INFO - combo.training.trainer - Epoch duration: 0:01:15.303924\n",
+      "2023-04-06 23:07:49,045 - INFO - combo.training.trainer - Estimated training time remaining: 7:17:08\n",
+      "2023-04-06 23:07:49,045 - INFO - allennlp.training.trainer - Epoch 16/399\n",
+      "2023-04-06 23:07:49,045 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:07:49,045 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:07:49,051 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9318, LAS: 0.8614, UEM: 0.4894, LEM: 0.1965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4096, partial_loss/deprel_loss: 0.6358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6683, loss: 0.8488, batch_reg_loss: 0.0777, reg_loss: 0.0777 ||:   3%|3         | 3/95 [00:02<01:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8948, UAS: 0.9351, LAS: 0.8664, UEM: 0.5156, LEM: 0.2211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3136, partial_loss/deprel_loss: 0.5873, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6103, loss: 0.8393, batch_reg_loss: 0.0778, reg_loss: 0.0777 ||:   6%|6         | 6/95 [00:04<01:01,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8190, UAS: 0.9224, LAS: 0.8541, UEM: 0.4664, LEM: 0.2007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2185, partial_loss/deprel_loss: 1.1788, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2646, loss: 0.9456, batch_reg_loss: 0.0779, reg_loss: 0.0778 ||:   9%|9         | 9/95 [00:06<01:02,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7607, UAS: 0.9187, LAS: 0.8505, UEM: 0.4539, LEM: 0.2013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8743, partial_loss/deprel_loss: 1.5597, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7006, loss: 0.9853, batch_reg_loss: 0.0779, reg_loss: 0.0778 ||:  14%|#3        | 13/95 [00:08<00:56,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8719, UAS: 0.9187, LAS: 0.8500, UEM: 0.4268, LEM: 0.1787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6203, partial_loss/deprel_loss: 0.8485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8809, loss: 0.9889, batch_reg_loss: 0.0780, reg_loss: 0.0779 ||:  18%|#7        | 17/95 [00:11<00:52,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9209, LAS: 0.8532, UEM: 0.5132, LEM: 0.2954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0836, partial_loss/deprel_loss: 0.2480, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2932, loss: 0.9624, batch_reg_loss: 0.0781, reg_loss: 0.0779 ||:  21%|##1       | 20/95 [00:13<00:53,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8675, UAS: 0.9204, LAS: 0.8518, UEM: 0.4941, LEM: 0.2748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5449, partial_loss/deprel_loss: 0.7685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8019, loss: 0.9736, batch_reg_loss: 0.0782, reg_loss: 0.0779 ||:  24%|##4       | 23/95 [00:16<00:54,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8178, UAS: 0.9184, LAS: 0.8495, UEM: 0.4660, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2759, partial_loss/deprel_loss: 1.2168, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3069, loss: 0.9971, batch_reg_loss: 0.0783, reg_loss: 0.0780 ||:  28%|##8       | 27/95 [00:18<00:48,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9170, LAS: 0.8477, UEM: 0.4600, LEM: 0.2430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3825, partial_loss/deprel_loss: 0.7065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7200, loss: 1.0084, batch_reg_loss: 0.0783, reg_loss: 0.0780 ||:  32%|###1      | 30/95 [00:20<00:45,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9193, LAS: 0.8501, UEM: 0.4875, LEM: 0.2571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7251, partial_loss/deprel_loss: 0.9890, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0146, loss: 0.9834, batch_reg_loss: 0.0784, reg_loss: 0.0780 ||:  35%|###4      | 33/95 [00:23<00:43,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9216, LAS: 0.8526, UEM: 0.4994, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2514, partial_loss/deprel_loss: 0.5023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5306, loss: 0.9620, batch_reg_loss: 0.0785, reg_loss: 0.0781 ||:  39%|###8      | 37/95 [00:25<00:40,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9241, LAS: 0.8557, UEM: 0.5129, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4850, partial_loss/deprel_loss: 0.7002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7357, loss: 0.9371, batch_reg_loss: 0.0786, reg_loss: 0.0781 ||:  43%|####3     | 41/95 [00:28<00:36,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7890, UAS: 0.9220, LAS: 0.8531, UEM: 0.5083, LEM: 0.2616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5592, partial_loss/deprel_loss: 1.3944, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5060, loss: 0.9564, batch_reg_loss: 0.0786, reg_loss: 0.0782 ||:  47%|####7     | 45/95 [00:30<00:33,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9210, LAS: 0.8520, UEM: 0.5033, LEM: 0.2549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3487, partial_loss/deprel_loss: 0.6453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6647, loss: 0.9648, batch_reg_loss: 0.0787, reg_loss: 0.0782 ||:  52%|#####1    | 49/95 [00:33<00:29,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9236, LAS: 0.8552, UEM: 0.5331, LEM: 0.2771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1897, partial_loss/deprel_loss: 0.4239, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4559, loss: 0.9363, batch_reg_loss: 0.0788, reg_loss: 0.0783 ||:  56%|#####5    | 53/95 [00:36<00:29,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8068, UAS: 0.9221, LAS: 0.8535, UEM: 0.5169, LEM: 0.2669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3648, partial_loss/deprel_loss: 1.2916, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3851, loss: 0.9517, batch_reg_loss: 0.0789, reg_loss: 0.0783 ||:  60%|######    | 57/95 [00:38<00:25,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9216, LAS: 0.8529, UEM: 0.5135, LEM: 0.2648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3539, partial_loss/deprel_loss: 0.5904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6220, loss: 0.9594, batch_reg_loss: 0.0790, reg_loss: 0.0783 ||:  63%|######3   | 60/95 [00:40<00:23,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8594, UAS: 0.9202, LAS: 0.8514, UEM: 0.5009, LEM: 0.2553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7087, partial_loss/deprel_loss: 0.8273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8826, loss: 0.9733, batch_reg_loss: 0.0790, reg_loss: 0.0784 ||:  67%|######7   | 64/95 [00:43<00:20,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8087, UAS: 0.9195, LAS: 0.8504, UEM: 0.4911, LEM: 0.2478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3806, partial_loss/deprel_loss: 1.2804, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3796, loss: 0.9849, batch_reg_loss: 0.0791, reg_loss: 0.0784 ||:  72%|#######1  | 68/95 [00:46<00:17,  1.52it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8748, UAS: 0.9189, LAS: 0.8495, UEM: 0.4932, LEM: 0.2464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4074, partial_loss/deprel_loss: 0.7526, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7627, loss: 0.9879, batch_reg_loss: 0.0792, reg_loss: 0.0785 ||:  76%|#######5  | 72/95 [00:48<00:15,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9204, LAS: 0.8514, UEM: 0.5069, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3735, partial_loss/deprel_loss: 0.6245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6536, loss: 0.9719, batch_reg_loss: 0.0793, reg_loss: 0.0785 ||:  80%|########  | 76/95 [00:51<00:12,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7064, UAS: 0.9186, LAS: 0.8495, UEM: 0.5170, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.9467, partial_loss/deprel_loss: 1.9418, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2222, loss: 0.9877, batch_reg_loss: 0.0794, reg_loss: 0.0785 ||:  83%|########3 | 79/95 [00:53<00:11,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9169, LAS: 0.8478, UEM: 0.5171, LEM: 0.2693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3720, partial_loss/deprel_loss: 0.6572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6795, loss: 1.0014, batch_reg_loss: 0.0794, reg_loss: 0.0786 ||:  86%|########6 | 82/95 [00:56<00:09,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8852, UAS: 0.9178, LAS: 0.8489, UEM: 0.5172, LEM: 0.2672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4747, partial_loss/deprel_loss: 0.6203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6707, loss: 0.9920, batch_reg_loss: 0.0795, reg_loss: 0.0786 ||:  91%|######### | 86/95 [00:59<00:06,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7905, UAS: 0.9173, LAS: 0.8484, UEM: 0.5160, LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4908, partial_loss/deprel_loss: 1.3661, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4706, loss: 0.9963, batch_reg_loss: 0.0796, reg_loss: 0.0786 ||:  94%|#########3| 89/95 [01:01<00:04,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8267, UAS: 0.9177, LAS: 0.8486, UEM: 0.5121, LEM: 0.2636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8148, partial_loss/deprel_loss: 1.1143, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1341, loss: 0.9947, batch_reg_loss: 0.0797, reg_loss: 0.0787 ||:  97%|#########6| 92/95 [01:03<00:02,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8112, UAS: 0.9175, LAS: 0.8483, UEM: 0.5078, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1950, partial_loss/deprel_loss: 1.2697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3345, loss: 0.9974, batch_reg_loss: 0.0797, reg_loss: 0.0787 ||: 100%|##########| 95/95 [01:05<00:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8112, UAS: 0.9175, LAS: 0.8483, UEM: 0.5078, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1950, partial_loss/deprel_loss: 1.2697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3345, loss: 0.9974, batch_reg_loss: 0.0797, reg_loss: 0.0787 ||: 100%|##########| 95/95 [01:05<00:00,  1.45it/s]\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.079  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - UEM                      |     0.508  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - LEM                      |     0.260  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - EM                       |     0.811  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.195  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - UAS                      |     0.918  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.270  |       N/A\n",
+      "2023-04-06 23:08:54,695 - INFO - combo.training.tensorboard_writer - loss                     |     0.997  |       N/A\n",
+      "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - LAS                      |     0.848  |       N/A\n",
+      "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.325  |       N/A\n",
+      "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:08:54,696 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:08:54,696 - INFO - combo.training.trainer - Epoch duration: 0:01:05.651487\n",
+      "2023-04-06 23:08:54,697 - INFO - combo.training.trainer - Estimated training time remaining: 7:15:00\n",
+      "2023-04-06 23:08:54,697 - INFO - allennlp.training.trainer - Epoch 17/399\n",
+      "2023-04-06 23:08:54,697 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:08:54,697 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:08:54,702 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8211, UAS: 0.9094, LAS: 0.8421, UEM: 0.4571, LEM: 0.2251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2175, partial_loss/deprel_loss: 1.1695, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2589, loss: 1.0662, batch_reg_loss: 0.0798, reg_loss: 0.0798 ||:   3%|3         | 3/95 [00:02<01:08,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8607, UAS: 0.9177, LAS: 0.8486, UEM: 0.4710, LEM: 0.2165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6351, partial_loss/deprel_loss: 0.8392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8782, loss: 1.0078, batch_reg_loss: 0.0799, reg_loss: 0.0798 ||:   7%|7         | 7/95 [00:04<01:03,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9068, UAS: 0.9255, LAS: 0.8579, UEM: 0.4782, LEM: 0.2083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2571, partial_loss/deprel_loss: 0.5411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5643, loss: 0.9388, batch_reg_loss: 0.0800, reg_loss: 0.0799 ||:  12%|#1        | 11/95 [00:07<00:59,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8603, UAS: 0.9292, LAS: 0.8630, UEM: 0.5108, LEM: 0.2318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6941, partial_loss/deprel_loss: 0.8530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9013, loss: 0.8938, batch_reg_loss: 0.0800, reg_loss: 0.0799 ||:  15%|#4        | 14/95 [00:09<00:56,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9276, LAS: 0.8610, UEM: 0.4956, LEM: 0.2220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4762, partial_loss/deprel_loss: 0.7494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7748, loss: 0.9064, batch_reg_loss: 0.0801, reg_loss: 0.0799 ||:  18%|#7        | 17/95 [00:12<00:57,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8561, UAS: 0.9244, LAS: 0.8568, UEM: 0.4666, LEM: 0.2043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7222, partial_loss/deprel_loss: 0.8504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9049, loss: 0.9373, batch_reg_loss: 0.0802, reg_loss: 0.0800 ||:  21%|##1       | 20/95 [00:14<00:54,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8657, UAS: 0.9269, LAS: 0.8603, UEM: 0.5326, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5957, partial_loss/deprel_loss: 0.7876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8294, loss: 0.9040, batch_reg_loss: 0.0802, reg_loss: 0.0800 ||:  24%|##4       | 23/95 [00:16<00:54,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8330, UAS: 0.9240, LAS: 0.8568, UEM: 0.5163, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9524, partial_loss/deprel_loss: 1.0799, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1347, loss: 0.9328, batch_reg_loss: 0.0803, reg_loss: 0.0800 ||:  27%|##7       | 26/95 [00:18<00:50,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8368, UAS: 0.9238, LAS: 0.8563, UEM: 0.5109, LEM: 0.2744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8677, partial_loss/deprel_loss: 1.1584, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1806, loss: 0.9377, batch_reg_loss: 0.0804, reg_loss: 0.0801 ||:  31%|###       | 29/95 [00:21<00:49,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9227, LAS: 0.8549, UEM: 0.5017, LEM: 0.2652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5467, partial_loss/deprel_loss: 0.7827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8159, loss: 0.9461, batch_reg_loss: 0.0804, reg_loss: 0.0801 ||:  35%|###4      | 33/95 [00:23<00:43,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9224, LAS: 0.8544, UEM: 0.4874, LEM: 0.2528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4548, partial_loss/deprel_loss: 0.7003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7317, loss: 0.9517, batch_reg_loss: 0.0805, reg_loss: 0.0801 ||:  39%|###8      | 37/95 [00:25<00:38,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9221, LAS: 0.8539, UEM: 0.4947, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4211, partial_loss/deprel_loss: 0.7539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7679, loss: 0.9597, batch_reg_loss: 0.0806, reg_loss: 0.0802 ||:  43%|####3     | 41/95 [00:28<00:36,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8369, UAS: 0.9180, LAS: 0.8491, UEM: 0.4773, LEM: 0.2463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8364, partial_loss/deprel_loss: 0.9655, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0204, loss: 1.0019, batch_reg_loss: 0.0807, reg_loss: 0.0802 ||:  47%|####7     | 45/95 [00:30<00:32,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9179, LAS: 0.8491, UEM: 0.4911, LEM: 0.2535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2303, partial_loss/deprel_loss: 0.5202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5430, loss: 0.9998, batch_reg_loss: 0.0808, reg_loss: 0.0803 ||:  52%|#####1    | 49/95 [00:33<00:31,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9195, LAS: 0.8512, UEM: 0.4988, LEM: 0.2546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5456, partial_loss/deprel_loss: 0.7183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7646, loss: 0.9834, batch_reg_loss: 0.0809, reg_loss: 0.0803 ||:  55%|#####4    | 52/95 [00:35<00:29,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8208, UAS: 0.9200, LAS: 0.8515, UEM: 0.4981, LEM: 0.2511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0464, partial_loss/deprel_loss: 1.1652, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2224, loss: 0.9811, batch_reg_loss: 0.0810, reg_loss: 0.0803 ||:  58%|#####7    | 55/95 [00:37<00:27,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7881, UAS: 0.9196, LAS: 0.8511, UEM: 0.4950, LEM: 0.2480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5286, partial_loss/deprel_loss: 1.3468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4642, loss: 0.9830, batch_reg_loss: 0.0810, reg_loss: 0.0804 ||:  61%|######1   | 58/95 [00:40<00:25,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8583, UAS: 0.9208, LAS: 0.8526, UEM: 0.5058, LEM: 0.2540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5972, partial_loss/deprel_loss: 0.8106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8490, loss: 0.9690, batch_reg_loss: 0.0811, reg_loss: 0.0804 ||:  64%|######4   | 61/95 [00:42<00:24,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8537, UAS: 0.9221, LAS: 0.8539, UEM: 0.5137, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8451, partial_loss/deprel_loss: 0.9112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9792, loss: 0.9557, batch_reg_loss: 0.0812, reg_loss: 0.0805 ||:  68%|######8   | 65/95 [00:45<00:20,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.9227, LAS: 0.8548, UEM: 0.5225, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8310, partial_loss/deprel_loss: 1.0333, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0741, loss: 0.9481, batch_reg_loss: 0.0812, reg_loss: 0.0805 ||:  72%|#######1  | 68/95 [00:47<00:19,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9229, LAS: 0.8549, UEM: 0.5200, LEM: 0.2643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3519, partial_loss/deprel_loss: 0.5175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5657, loss: 0.9448, batch_reg_loss: 0.0813, reg_loss: 0.0805 ||:  76%|#######5  | 72/95 [00:49<00:16,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9218, LAS: 0.8536, UEM: 0.5125, LEM: 0.2596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5668, partial_loss/deprel_loss: 0.7364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7839, loss: 0.9564, batch_reg_loss: 0.0814, reg_loss: 0.0806 ||:  80%|########  | 76/95 [00:52<00:12,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8361, UAS: 0.9197, LAS: 0.8512, UEM: 0.5029, LEM: 0.2530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8183, partial_loss/deprel_loss: 1.0178, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0594, loss: 0.9775, batch_reg_loss: 0.0815, reg_loss: 0.0806 ||:  84%|########4 | 80/95 [00:54<00:09,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9204, LAS: 0.8520, UEM: 0.5089, LEM: 0.2557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3322, partial_loss/deprel_loss: 0.6043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6315, loss: 0.9704, batch_reg_loss: 0.0816, reg_loss: 0.0807 ||:  88%|########8 | 84/95 [00:57<00:07,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7638, UAS: 0.9197, LAS: 0.8513, UEM: 0.5099, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8641, partial_loss/deprel_loss: 1.5048, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6583, loss: 0.9760, batch_reg_loss: 0.0816, reg_loss: 0.0807 ||:  92%|#########1| 87/95 [01:00<00:05,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9207, LAS: 0.8525, UEM: 0.5240, LEM: 0.2723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 0.3235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3733, loss: 0.9655, batch_reg_loss: 0.0817, reg_loss: 0.0807 ||:  95%|#########4| 90/95 [01:02<00:03,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8265, UAS: 0.9196, LAS: 0.8512, UEM: 0.5187, LEM: 0.2684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0582, partial_loss/deprel_loss: 1.0256, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1139, loss: 0.9761, batch_reg_loss: 0.0818, reg_loss: 0.0808 ||:  98%|#########7| 93/95 [01:04<00:01,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9198, LAS: 0.8514, UEM: 0.5192, LEM: 0.2679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3025, partial_loss/deprel_loss: 0.5928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6165, loss: 0.9746, batch_reg_loss: 0.0818, reg_loss: 0.0808 ||: 100%|##########| 95/95 [01:06<00:00,  1.44it/s]\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.081  |       N/A\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - UEM                      |     0.519  |       N/A\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - LEM                      |     0.268  |       N/A\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - EM                       |     0.899  |       N/A\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.302  |       N/A\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - UAS                      |     0.920  |       N/A\n",
+      "2023-04-06 23:10:00,782 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.593  |       N/A\n",
+      "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - loss                     |     0.975  |       N/A\n",
+      "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - LAS                      |     0.851  |       N/A\n",
+      "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.325  |       N/A\n",
+      "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:10:00,783 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:10:00,783 - INFO - combo.training.trainer - Epoch duration: 0:01:06.086857\n",
+      "2023-04-06 23:10:00,784 - INFO - combo.training.trainer - Estimated training time remaining: 7:13:08\n",
+      "2023-04-06 23:10:00,784 - INFO - allennlp.training.trainer - Epoch 18/399\n",
+      "2023-04-06 23:10:00,784 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:10:00,784 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:10:00,790 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8063, UAS: 0.9016, LAS: 0.8326, UEM: 0.3613, LEM: 0.1450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3579, partial_loss/deprel_loss: 1.2578, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3597, loss: 1.1402, batch_reg_loss: 0.0819, reg_loss: 0.0819 ||:   4%|4         | 4/95 [00:02<00:57,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9147, LAS: 0.8475, UEM: 0.4064, LEM: 0.1864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6307, partial_loss/deprel_loss: 0.8028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8504, loss: 1.0049, batch_reg_loss: 0.0820, reg_loss: 0.0819 ||:   8%|8         | 8/95 [00:05<00:55,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9260, LAS: 0.8603, UEM: 0.5197, LEM: 0.2540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2139, partial_loss/deprel_loss: 0.4959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5216, loss: 0.9117, batch_reg_loss: 0.0821, reg_loss: 0.0820 ||:  13%|#2        | 12/95 [00:07<00:53,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9277, LAS: 0.8604, UEM: 0.5508, LEM: 0.2655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3392, partial_loss/deprel_loss: 0.6802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6942, loss: 0.9067, batch_reg_loss: 0.0822, reg_loss: 0.0820 ||:  16%|#5        | 15/95 [00:09<00:52,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8069, UAS: 0.9241, LAS: 0.8566, UEM: 0.5429, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2321, partial_loss/deprel_loss: 1.1701, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2647, loss: 0.9299, batch_reg_loss: 0.0822, reg_loss: 0.0820 ||:  19%|#8        | 18/95 [00:12<00:52,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9226, LAS: 0.8539, UEM: 0.5082, LEM: 0.2467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7400, partial_loss/deprel_loss: 0.9208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9670, loss: 0.9604, batch_reg_loss: 0.0823, reg_loss: 0.0821 ||:  23%|##3       | 22/95 [00:14<00:47,  1.54it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8159, UAS: 0.9219, LAS: 0.8527, UEM: 0.4923, LEM: 0.2314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1987, partial_loss/deprel_loss: 1.2112, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2911, loss: 0.9728, batch_reg_loss: 0.0824, reg_loss: 0.0821 ||:  26%|##6       | 25/95 [00:16<00:46,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8190, UAS: 0.9208, LAS: 0.8517, UEM: 0.4836, LEM: 0.2277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2457, partial_loss/deprel_loss: 1.1310, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2364, loss: 0.9771, batch_reg_loss: 0.0824, reg_loss: 0.0821 ||:  29%|##9       | 28/95 [00:18<00:45,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8890, UAS: 0.9225, LAS: 0.8538, UEM: 0.4998, LEM: 0.2389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3777, partial_loss/deprel_loss: 0.6058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6427, loss: 0.9584, batch_reg_loss: 0.0825, reg_loss: 0.0822 ||:  33%|###2      | 31/95 [00:20<00:44,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9247, LAS: 0.8565, UEM: 0.5108, LEM: 0.2453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2491, partial_loss/deprel_loss: 0.4766, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5137, loss: 0.9393, batch_reg_loss: 0.0826, reg_loss: 0.0822 ||:  37%|###6      | 35/95 [00:23<00:42,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9260, LAS: 0.8585, UEM: 0.5073, LEM: 0.2391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5593, partial_loss/deprel_loss: 0.7965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8317, loss: 0.9242, batch_reg_loss: 0.0827, reg_loss: 0.0823 ||:  41%|####1     | 39/95 [00:26<00:38,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9277, LAS: 0.8603, UEM: 0.5189, LEM: 0.2430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4367, partial_loss/deprel_loss: 0.6974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7280, loss: 0.9088, batch_reg_loss: 0.0827, reg_loss: 0.0823 ||:  44%|####4     | 42/95 [00:28<00:37,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7823, UAS: 0.9266, LAS: 0.8590, UEM: 0.5181, LEM: 0.2452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6739, partial_loss/deprel_loss: 1.5471, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6553, loss: 0.9214, batch_reg_loss: 0.0828, reg_loss: 0.0823 ||:  47%|####7     | 45/95 [00:30<00:34,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9271, LAS: 0.8590, UEM: 0.5167, LEM: 0.2423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3455, partial_loss/deprel_loss: 0.5809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6167, loss: 0.9202, batch_reg_loss: 0.0829, reg_loss: 0.0824 ||:  52%|#####1    | 49/95 [00:33<00:31,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9254, LAS: 0.8574, UEM: 0.5037, LEM: 0.2336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6386, partial_loss/deprel_loss: 0.8472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8885, loss: 0.9353, batch_reg_loss: 0.0830, reg_loss: 0.0824 ||:  56%|#####5    | 53/95 [00:35<00:27,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9235, LAS: 0.8553, UEM: 0.5002, LEM: 0.2311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3206, partial_loss/deprel_loss: 0.6063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6322, loss: 0.9538, batch_reg_loss: 0.0831, reg_loss: 0.0825 ||:  60%|######    | 57/95 [00:37<00:24,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.9217, LAS: 0.8532, UEM: 0.4937, LEM: 0.2270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6313, partial_loss/deprel_loss: 0.7961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8463, loss: 0.9686, batch_reg_loss: 0.0831, reg_loss: 0.0825 ||:  64%|######4   | 61/95 [00:40<00:21,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8383, UAS: 0.9221, LAS: 0.8537, UEM: 0.5130, LEM: 0.2585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8276, partial_loss/deprel_loss: 1.0782, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1113, loss: 0.9656, batch_reg_loss: 0.0832, reg_loss: 0.0825 ||:  68%|######8   | 65/95 [00:43<00:20,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8797, UAS: 0.9227, LAS: 0.8546, UEM: 0.5260, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3946, partial_loss/deprel_loss: 0.6266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6635, loss: 0.9557, batch_reg_loss: 0.0833, reg_loss: 0.0826 ||:  72%|#######1  | 68/95 [00:46<00:20,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8142, UAS: 0.9225, LAS: 0.8545, UEM: 0.5218, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3803, partial_loss/deprel_loss: 1.2825, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3855, loss: 0.9600, batch_reg_loss: 0.0834, reg_loss: 0.0826 ||:  75%|#######4  | 71/95 [00:48<00:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7495, UAS: 0.9206, LAS: 0.8526, UEM: 0.5165, LEM: 0.2648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2523, partial_loss/deprel_loss: 1.6199, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8299, loss: 0.9755, batch_reg_loss: 0.0835, reg_loss: 0.0826 ||:  78%|#######7  | 74/95 [00:50<00:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9207, LAS: 0.8526, UEM: 0.5172, LEM: 0.2657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4643, partial_loss/deprel_loss: 0.7071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7421, loss: 0.9738, batch_reg_loss: 0.0835, reg_loss: 0.0827 ||:  82%|########2 | 78/95 [00:53<00:12,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7802, UAS: 0.9204, LAS: 0.8522, UEM: 0.5150, LEM: 0.2624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7017, partial_loss/deprel_loss: 1.4659, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5967, loss: 0.9763, batch_reg_loss: 0.0836, reg_loss: 0.0827 ||:  86%|########6 | 82/95 [00:55<00:08,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9201, LAS: 0.8519, UEM: 0.5133, LEM: 0.2586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8410, partial_loss/deprel_loss: 0.9424, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0059, loss: 0.9782, batch_reg_loss: 0.0837, reg_loss: 0.0828 ||:  91%|######### | 86/95 [00:58<00:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9205, LAS: 0.8524, UEM: 0.5166, LEM: 0.2627, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.8882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9179, loss: 0.9757, batch_reg_loss: 0.0838, reg_loss: 0.0828 ||:  95%|#########4| 90/95 [01:00<00:03,  1.54it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8401, UAS: 0.9208, LAS: 0.8527, UEM: 0.5221, LEM: 0.2707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7381, partial_loss/deprel_loss: 0.9807, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0161, loss: 0.9715, batch_reg_loss: 0.0839, reg_loss: 0.0829 ||:  99%|#########8| 94/95 [01:02<00:00,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8543, UAS: 0.9209, LAS: 0.8527, UEM: 0.5206, LEM: 0.2690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6922, partial_loss/deprel_loss: 0.8876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9324, loss: 0.9711, batch_reg_loss: 0.0839, reg_loss: 0.0829 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.083  |       N/A\n",
+      "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - UEM                      |     0.521  |       N/A\n",
+      "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - LEM                      |     0.269  |       N/A\n",
+      "2023-04-06 23:11:04,380 - INFO - combo.training.tensorboard_writer - EM                       |     0.854  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.692  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - UAS                      |     0.921  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.888  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - loss                     |     0.971  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - LAS                      |     0.853  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.325  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:11:04,381 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:11:04,382 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:11:04,382 - INFO - combo.training.trainer - Epoch duration: 0:01:03.598358\n",
+      "2023-04-06 23:11:04,382 - INFO - combo.training.trainer - Estimated training time remaining: 7:10:31\n",
+      "2023-04-06 23:11:04,382 - INFO - allennlp.training.trainer - Epoch 19/399\n",
+      "2023-04-06 23:11:04,382 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:11:04,383 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:11:04,388 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8330, UAS: 0.9435, LAS: 0.8860, UEM: 0.7204, LEM: 0.4746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9285, partial_loss/deprel_loss: 1.0618, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1192, loss: 0.6993, batch_reg_loss: 0.0840, reg_loss: 0.0840 ||:   3%|3         | 3/95 [00:02<01:09,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8009, UAS: 0.9156, LAS: 0.8519, UEM: 0.5387, LEM: 0.3258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6037, partial_loss/deprel_loss: 1.2293, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3883, loss: 0.9807, batch_reg_loss: 0.0841, reg_loss: 0.0840 ||:   7%|7         | 7/95 [00:04<01:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9223, LAS: 0.8586, UEM: 0.5432, LEM: 0.3024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3469, partial_loss/deprel_loss: 0.6004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6339, loss: 0.9240, batch_reg_loss: 0.0841, reg_loss: 0.0840 ||:  11%|#         | 10/95 [00:07<01:04,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9256, LAS: 0.8612, UEM: 0.5207, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8806, partial_loss/deprel_loss: 0.9421, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0140, loss: 0.8929, batch_reg_loss: 0.0842, reg_loss: 0.0841 ||:  15%|#4        | 14/95 [00:09<00:57,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7806, UAS: 0.9192, LAS: 0.8538, UEM: 0.5271, LEM: 0.2799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6357, partial_loss/deprel_loss: 1.4219, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5490, loss: 0.9499, batch_reg_loss: 0.0843, reg_loss: 0.0841 ||:  19%|#8        | 18/95 [00:12<00:52,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9156, LAS: 0.8487, UEM: 0.4943, LEM: 0.2532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5104, partial_loss/deprel_loss: 0.7872, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8163, loss: 0.9940, batch_reg_loss: 0.0844, reg_loss: 0.0842 ||:  23%|##3       | 22/95 [00:14<00:48,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8561, UAS: 0.9168, LAS: 0.8503, UEM: 0.4811, LEM: 0.2394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7056, partial_loss/deprel_loss: 0.8735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9244, loss: 0.9825, batch_reg_loss: 0.0845, reg_loss: 0.0842 ||:  26%|##6       | 25/95 [00:16<00:46,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9175, LAS: 0.8506, UEM: 0.4635, LEM: 0.2253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4135, partial_loss/deprel_loss: 0.6657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6998, loss: 0.9775, batch_reg_loss: 0.0846, reg_loss: 0.0843 ||:  31%|###       | 29/95 [00:18<00:41,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9197, LAS: 0.8531, UEM: 0.4805, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4015, partial_loss/deprel_loss: 0.6840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7122, loss: 0.9550, batch_reg_loss: 0.0847, reg_loss: 0.0843 ||:  35%|###4      | 33/95 [00:21<00:40,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9224, LAS: 0.8559, UEM: 0.5072, LEM: 0.2469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.5334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5645, loss: 0.9343, batch_reg_loss: 0.0848, reg_loss: 0.0844 ||:  39%|###8      | 37/95 [00:24<00:39,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9217, LAS: 0.8554, UEM: 0.4989, LEM: 0.2412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5131, partial_loss/deprel_loss: 0.6908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7401, loss: 0.9416, batch_reg_loss: 0.0849, reg_loss: 0.0844 ||:  42%|####2     | 40/95 [00:26<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8368, UAS: 0.9233, LAS: 0.8573, UEM: 0.5106, LEM: 0.2486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9475, partial_loss/deprel_loss: 1.0811, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1393, loss: 0.9286, batch_reg_loss: 0.0849, reg_loss: 0.0844 ||:  45%|####5     | 43/95 [00:28<00:36,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.9236, LAS: 0.8577, UEM: 0.5018, LEM: 0.2420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9378, partial_loss/deprel_loss: 0.9711, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0495, loss: 0.9265, batch_reg_loss: 0.0850, reg_loss: 0.0845 ||:  48%|####8     | 46/95 [00:31<00:34,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9245, LAS: 0.8588, UEM: 0.5113, LEM: 0.2475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3375, partial_loss/deprel_loss: 0.5103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5608, loss: 0.9145, batch_reg_loss: 0.0851, reg_loss: 0.0845 ||:  52%|#####1    | 49/95 [00:33<00:33,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8744, UAS: 0.9246, LAS: 0.8589, UEM: 0.5174, LEM: 0.2533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4168, partial_loss/deprel_loss: 0.7370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7581, loss: 0.9116, batch_reg_loss: 0.0851, reg_loss: 0.0845 ||:  55%|#####4    | 52/95 [00:35<00:30,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9250, LAS: 0.8593, UEM: 0.5118, LEM: 0.2468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7121, partial_loss/deprel_loss: 0.8879, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9379, loss: 0.9107, batch_reg_loss: 0.0852, reg_loss: 0.0846 ||:  59%|#####8    | 56/95 [00:37<00:26,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8288, UAS: 0.9247, LAS: 0.8590, UEM: 0.5060, LEM: 0.2419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1599, partial_loss/deprel_loss: 1.1592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2446, loss: 0.9141, batch_reg_loss: 0.0853, reg_loss: 0.0846 ||:  62%|######2   | 59/95 [00:39<00:24,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8143, UAS: 0.9251, LAS: 0.8594, UEM: 0.5113, LEM: 0.2465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3870, partial_loss/deprel_loss: 1.3038, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4058, loss: 0.9143, batch_reg_loss: 0.0853, reg_loss: 0.0846 ||:  65%|######5   | 62/95 [00:42<00:23,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9266, LAS: 0.8613, UEM: 0.5381, LEM: 0.2765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1560, partial_loss/deprel_loss: 0.3884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4274, loss: 0.8983, batch_reg_loss: 0.0854, reg_loss: 0.0847 ||:  69%|######9   | 66/95 [00:44<00:20,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9263, LAS: 0.8610, UEM: 0.5383, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3126, partial_loss/deprel_loss: 0.4687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5230, loss: 0.9019, batch_reg_loss: 0.0855, reg_loss: 0.0847 ||:  73%|#######2  | 69/95 [00:47<00:18,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8739, UAS: 0.9269, LAS: 0.8615, UEM: 0.5384, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4765, partial_loss/deprel_loss: 0.6877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7310, loss: 0.8967, batch_reg_loss: 0.0855, reg_loss: 0.0848 ||:  76%|#######5  | 72/95 [00:49<00:15,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8586, UAS: 0.9264, LAS: 0.8608, UEM: 0.5295, LEM: 0.2685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6799, partial_loss/deprel_loss: 0.8600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9096, loss: 0.9015, batch_reg_loss: 0.0856, reg_loss: 0.0848 ||:  80%|########  | 76/95 [00:51<00:12,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7132, UAS: 0.9240, LAS: 0.8580, UEM: 0.5249, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6995, partial_loss/deprel_loss: 1.8867, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1350, loss: 0.9255, batch_reg_loss: 0.0857, reg_loss: 0.0848 ||:  84%|########4 | 80/95 [00:53<00:09,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8211, UAS: 0.9225, LAS: 0.8562, UEM: 0.5163, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0998, partial_loss/deprel_loss: 1.1962, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2627, loss: 0.9415, batch_reg_loss: 0.0858, reg_loss: 0.0849 ||:  88%|########8 | 84/95 [00:56<00:07,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8162, UAS: 0.9213, LAS: 0.8547, UEM: 0.5081, LEM: 0.2550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2418, partial_loss/deprel_loss: 1.2224, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3122, loss: 0.9540, batch_reg_loss: 0.0859, reg_loss: 0.0849 ||:  93%|#########2| 88/95 [00:59<00:04,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.9229, LAS: 0.8565, UEM: 0.5315, LEM: 0.2803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4410, partial_loss/deprel_loss: 0.8339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8413, loss: 0.9397, batch_reg_loss: 0.0860, reg_loss: 0.0850 ||:  97%|#########6| 92/95 [01:02<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8902, UAS: 0.9226, LAS: 0.8561, UEM: 0.5297, LEM: 0.2785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3539, partial_loss/deprel_loss: 0.6098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6447, loss: 0.9430, batch_reg_loss: 0.0861, reg_loss: 0.0850 ||: 100%|##########| 95/95 [01:04<00:00,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8902, UAS: 0.9226, LAS: 0.8561, UEM: 0.5297, LEM: 0.2785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3539, partial_loss/deprel_loss: 0.6098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6447, loss: 0.9430, batch_reg_loss: 0.0861, reg_loss: 0.0850 ||: 100%|##########| 95/95 [01:04<00:00,  1.48it/s]\n",
+      "2023-04-06 23:12:08,723 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:12:08,723 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:12:08,723 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.085  |       N/A\n",
+      "2023-04-06 23:12:08,723 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - UEM                      |     0.530  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - LEM                      |     0.278  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - EM                       |     0.890  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.354  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - UAS                      |     0.923  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.610  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - loss                     |     0.943  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - LAS                      |     0.856  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.325  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:12:08,724 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:12:08,725 - INFO - combo.training.trainer - Epoch duration: 0:01:04.342871\n",
+      "2023-04-06 23:12:08,725 - INFO - combo.training.trainer - Estimated training time remaining: 7:08:17\n",
+      "2023-04-06 23:12:08,725 - INFO - allennlp.training.trainer - Epoch 20/399\n",
+      "2023-04-06 23:12:08,725 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:12:08,726 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:12:08,732 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9110, LAS: 0.8443, UEM: 0.3849, LEM: 0.1702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2972, partial_loss/deprel_loss: 0.5319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5711, loss: 1.0397, batch_reg_loss: 0.0862, reg_loss: 0.0861 ||:   4%|4         | 4/95 [00:02<01:01,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9310, LAS: 0.8659, UEM: 0.5533, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3611, partial_loss/deprel_loss: 0.5817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6238, loss: 0.8645, batch_reg_loss: 0.0862, reg_loss: 0.0862 ||:   8%|8         | 8/95 [00:05<00:58,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9336, LAS: 0.8679, UEM: 0.5478, LEM: 0.2519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4877, partial_loss/deprel_loss: 0.6900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7359, loss: 0.8320, batch_reg_loss: 0.0863, reg_loss: 0.0862 ||:  12%|#1        | 11/95 [00:07<00:57,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9324, LAS: 0.8653, UEM: 0.5534, LEM: 0.2555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4115, partial_loss/deprel_loss: 0.6690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7038, loss: 0.8553, batch_reg_loss: 0.0864, reg_loss: 0.0862 ||:  16%|#5        | 15/95 [00:09<00:51,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9284, LAS: 0.8616, UEM: 0.5068, LEM: 0.2273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1938, partial_loss/deprel_loss: 1.0830, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1916, loss: 0.8870, batch_reg_loss: 0.0865, reg_loss: 0.0863 ||:  20%|##        | 19/95 [00:12<00:47,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8691, UAS: 0.9314, LAS: 0.8659, UEM: 0.5482, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6033, partial_loss/deprel_loss: 0.7846, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8348, loss: 0.8500, batch_reg_loss: 0.0865, reg_loss: 0.0863 ||:  23%|##3       | 22/95 [00:14<00:51,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8376, UAS: 0.9259, LAS: 0.8598, UEM: 0.5101, LEM: 0.2451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9727, partial_loss/deprel_loss: 1.0948, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1570, loss: 0.9070, batch_reg_loss: 0.0866, reg_loss: 0.0864 ||:  27%|##7       | 26/95 [00:17<00:46,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8802, UAS: 0.9231, LAS: 0.8571, UEM: 0.4837, LEM: 0.2284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5614, partial_loss/deprel_loss: 0.6820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7446, loss: 0.9337, batch_reg_loss: 0.0867, reg_loss: 0.0864 ||:  32%|###1      | 30/95 [00:19<00:42,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9254, LAS: 0.8596, UEM: 0.5063, LEM: 0.2410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3327, partial_loss/deprel_loss: 0.5998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6332, loss: 0.9123, batch_reg_loss: 0.0868, reg_loss: 0.0864 ||:  35%|###4      | 33/95 [00:22<00:43,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7897, UAS: 0.9223, LAS: 0.8554, UEM: 0.4936, LEM: 0.2330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7403, partial_loss/deprel_loss: 1.4286, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5778, loss: 0.9495, batch_reg_loss: 0.0869, reg_loss: 0.0865 ||:  39%|###8      | 37/95 [00:24<00:39,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9210, LAS: 0.8539, UEM: 0.4811, LEM: 0.2228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5754, partial_loss/deprel_loss: 0.8188, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8571, loss: 0.9656, batch_reg_loss: 0.0870, reg_loss: 0.0865 ||:  43%|####3     | 41/95 [00:26<00:35,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9231, LAS: 0.8565, UEM: 0.5083, LEM: 0.2521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1527, partial_loss/deprel_loss: 0.4154, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.9443, batch_reg_loss: 0.0871, reg_loss: 0.0866 ||:  47%|####7     | 45/95 [00:29<00:33,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8537, UAS: 0.9231, LAS: 0.8567, UEM: 0.5003, LEM: 0.2448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7734, partial_loss/deprel_loss: 0.9690, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0170, loss: 0.9441, batch_reg_loss: 0.0871, reg_loss: 0.0866 ||:  51%|#####     | 48/95 [00:31<00:32,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9148, UAS: 0.9250, LAS: 0.8595, UEM: 0.5372, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2823, partial_loss/deprel_loss: 0.5420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5773, loss: 0.9245, batch_reg_loss: 0.0872, reg_loss: 0.0866 ||:  54%|#####3    | 51/95 [00:34<00:31,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9266, LAS: 0.8612, UEM: 0.5460, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3473, partial_loss/deprel_loss: 0.5949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6327, loss: 0.9112, batch_reg_loss: 0.0873, reg_loss: 0.0867 ||:  57%|#####6    | 54/95 [00:36<00:28,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8433, UAS: 0.9251, LAS: 0.8595, UEM: 0.5404, LEM: 0.2895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0079, partial_loss/deprel_loss: 0.9937, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0839, loss: 0.9280, batch_reg_loss: 0.0874, reg_loss: 0.0867 ||:  61%|######1   | 58/95 [00:38<00:24,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9247, LAS: 0.8591, UEM: 0.5448, LEM: 0.2945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5486, partial_loss/deprel_loss: 0.7013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7582, loss: 0.9304, batch_reg_loss: 0.0874, reg_loss: 0.0868 ||:  65%|######5   | 62/95 [00:41<00:22,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8300, UAS: 0.9228, LAS: 0.8570, UEM: 0.5325, LEM: 0.2853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0626, partial_loss/deprel_loss: 1.0727, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1582, loss: 0.9464, batch_reg_loss: 0.0875, reg_loss: 0.0868 ||:  69%|######9   | 66/95 [00:44<00:19,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9230, LAS: 0.8569, UEM: 0.5244, LEM: 0.2780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4814, partial_loss/deprel_loss: 0.7219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7614, loss: 0.9487, batch_reg_loss: 0.0876, reg_loss: 0.0868 ||:  74%|#######3  | 70/95 [00:47<00:17,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9237, LAS: 0.8577, UEM: 0.5248, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4907, partial_loss/deprel_loss: 0.7567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7911, loss: 0.9429, batch_reg_loss: 0.0877, reg_loss: 0.0869 ||:  77%|#######6  | 73/95 [00:49<00:15,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9242, LAS: 0.8581, UEM: 0.5217, LEM: 0.2723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3526, partial_loss/deprel_loss: 0.6355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6667, loss: 0.9388, batch_reg_loss: 0.0878, reg_loss: 0.0869 ||:  81%|########1 | 77/95 [00:51<00:12,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7475, UAS: 0.9237, LAS: 0.8577, UEM: 0.5224, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3742, partial_loss/deprel_loss: 1.6319, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8683, loss: 0.9423, batch_reg_loss: 0.0879, reg_loss: 0.0870 ||:  85%|########5 | 81/95 [00:54<00:09,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8607, UAS: 0.9248, LAS: 0.8591, UEM: 0.5373, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6663, partial_loss/deprel_loss: 0.7912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8541, loss: 0.9301, batch_reg_loss: 0.0879, reg_loss: 0.0870 ||:  88%|########8 | 84/95 [00:56<00:07,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7260, UAS: 0.9236, LAS: 0.8578, UEM: 0.5355, LEM: 0.2844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6770, partial_loss/deprel_loss: 1.8716, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1207, loss: 0.9407, batch_reg_loss: 0.0880, reg_loss: 0.0870 ||:  92%|#########1| 87/95 [00:58<00:05,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.9228, LAS: 0.8568, UEM: 0.5279, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9349, partial_loss/deprel_loss: 1.0539, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1182, loss: 0.9479, batch_reg_loss: 0.0881, reg_loss: 0.0871 ||:  95%|#########4| 90/95 [01:00<00:03,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9235, LAS: 0.8578, UEM: 0.5311, LEM: 0.2795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7756, partial_loss/deprel_loss: 0.8687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9383, loss: 0.9384, batch_reg_loss: 0.0882, reg_loss: 0.0871 ||:  99%|#########8| 94/95 [01:03<00:00,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8695, UAS: 0.9237, LAS: 0.8579, UEM: 0.5307, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5919, partial_loss/deprel_loss: 0.8331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8731, loss: 0.9377, batch_reg_loss: 0.0882, reg_loss: 0.0871 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-06 23:13:12,510 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9319, LAS: 0.8801, UEM: 0.7776, LEM: 0.6212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2257, partial_loss/deprel_loss: 19.5722, partial_loss/cycle_loss: 0.0000, batch_loss: 15.7029, loss: 30.2250, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.08s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9292, LAS: 0.8706, UEM: 0.5947, LEM: 0.3993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7996, partial_loss/deprel_loss: 32.6935, partial_loss/cycle_loss: 0.0000, batch_loss: 26.3147, loss: 28.7042, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:06,  1.03s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9410, LAS: 0.8846, UEM: 0.6785, LEM: 0.4306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3704, partial_loss/deprel_loss: 23.8122, partial_loss/cycle_loss: 0.0000, batch_loss: 19.1238, loss: 25.7829, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:06<00:04,  1.04s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9433, LAS: 0.8857, UEM: 0.6618, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3140, partial_loss/deprel_loss: 27.5430, partial_loss/cycle_loss: 0.0000, batch_loss: 22.0972, loss: 26.3043, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:09<00:00,  1.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9434, LAS: 0.8851, UEM: 0.6533, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5105, partial_loss/deprel_loss: 23.3250, partial_loss/cycle_loss: 0.0000, batch_loss: 18.7621, loss: 25.6187, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00,  1.13it/s]\n",
+      "2023-04-06 23:13:22,264 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.087  |     0.000\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - UEM                      |     0.531  |     0.653\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - LEM                      |     0.278  |     0.374\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - EM                       |     0.870  |     0.879\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.592  |     0.510\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - UAS                      |     0.924  |     0.943\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.833  |    23.325\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - loss                     |     0.938  |    25.619\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - LAS                      |     0.858  |     0.885\n",
+      "2023-04-06 23:13:22,265 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:13:22,266 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:13:22,266 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:13:22,266 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:13:22,266 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:13:22,266 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:13:22,266 - INFO - combo.training.trainer - Epoch duration: 0:01:13.540946\n",
+      "2023-04-06 23:13:22,266 - INFO - combo.training.trainer - Estimated training time remaining: 7:08:57\n",
+      "2023-04-06 23:13:22,266 - INFO - allennlp.training.trainer - Epoch 21/399\n",
+      "2023-04-06 23:13:22,267 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:13:22,267 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:13:22,273 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9221, LAS: 0.8546, UEM: 0.3557, LEM: 0.1229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4082, partial_loss/deprel_loss: 0.6628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7001, loss: 0.9470, batch_reg_loss: 0.0883, reg_loss: 0.0882 ||:   4%|4         | 4/95 [00:02<00:54,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8405, UAS: 0.9199, LAS: 0.8541, UEM: 0.3511, LEM: 0.1239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9181, partial_loss/deprel_loss: 1.0244, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0915, loss: 0.9805, batch_reg_loss: 0.0883, reg_loss: 0.0883 ||:   7%|7         | 7/95 [00:04<00:58,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9295, LAS: 0.8663, UEM: 0.6005, LEM: 0.4025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0708, partial_loss/deprel_loss: 0.2353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2908, loss: 0.8785, batch_reg_loss: 0.0884, reg_loss: 0.0883 ||:  11%|#         | 10/95 [00:07<01:01,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8384, UAS: 0.9190, LAS: 0.8538, UEM: 0.5549, LEM: 0.3586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9296, partial_loss/deprel_loss: 1.0548, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1183, loss: 0.9701, batch_reg_loss: 0.0885, reg_loss: 0.0883 ||:  14%|#3        | 13/95 [00:09<00:57,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9230, LAS: 0.8573, UEM: 0.5473, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5756, partial_loss/deprel_loss: 0.8580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8901, loss: 0.9454, batch_reg_loss: 0.0886, reg_loss: 0.0884 ||:  18%|#7        | 17/95 [00:11<00:52,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9273, LAS: 0.8625, UEM: 0.5692, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2405, partial_loss/deprel_loss: 0.4936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5317, loss: 0.9059, batch_reg_loss: 0.0887, reg_loss: 0.0884 ||:  22%|##2       | 21/95 [00:14<00:48,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9048, UAS: 0.9278, LAS: 0.8636, UEM: 0.5645, LEM: 0.3271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2945, partial_loss/deprel_loss: 0.5534, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5904, loss: 0.9013, batch_reg_loss: 0.0887, reg_loss: 0.0885 ||:  25%|##5       | 24/95 [00:16<00:47,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9298, LAS: 0.8662, UEM: 0.5759, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1747, partial_loss/deprel_loss: 0.3965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4410, loss: 0.8804, batch_reg_loss: 0.0888, reg_loss: 0.0885 ||:  29%|##9       | 28/95 [00:19<00:44,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9313, LAS: 0.8677, UEM: 0.5794, LEM: 0.3319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2287, partial_loss/deprel_loss: 0.4578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5008, loss: 0.8691, batch_reg_loss: 0.0889, reg_loss: 0.0886 ||:  33%|###2      | 31/95 [00:21<00:44,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9322, LAS: 0.8694, UEM: 0.5735, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4688, partial_loss/deprel_loss: 0.6444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6983, loss: 0.8587, batch_reg_loss: 0.0890, reg_loss: 0.0886 ||:  36%|###5      | 34/95 [00:23<00:43,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8696, UAS: 0.9288, LAS: 0.8655, UEM: 0.5588, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5252, partial_loss/deprel_loss: 0.7641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8053, loss: 0.8868, batch_reg_loss: 0.0890, reg_loss: 0.0886 ||:  39%|###8      | 37/95 [00:25<00:40,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.9269, LAS: 0.8634, UEM: 0.5501, LEM: 0.3038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8205, partial_loss/deprel_loss: 0.9077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9794, loss: 0.9034, batch_reg_loss: 0.0891, reg_loss: 0.0887 ||:  42%|####2     | 40/95 [00:27<00:39,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9280, LAS: 0.8645, UEM: 0.5619, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5773, partial_loss/deprel_loss: 0.7543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8081, loss: 0.8940, batch_reg_loss: 0.0892, reg_loss: 0.0887 ||:  46%|####6     | 44/95 [00:30<00:35,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8614, UAS: 0.9255, LAS: 0.8619, UEM: 0.5429, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8078, partial_loss/deprel_loss: 0.8197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9065, loss: 0.9176, batch_reg_loss: 0.0893, reg_loss: 0.0887 ||:  51%|#####     | 48/95 [00:32<00:31,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8261, UAS: 0.9226, LAS: 0.8587, UEM: 0.5308, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2410, partial_loss/deprel_loss: 1.1667, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2709, loss: 0.9484, batch_reg_loss: 0.0893, reg_loss: 0.0888 ||:  54%|#####3    | 51/95 [00:35<00:30,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9237, LAS: 0.8598, UEM: 0.5345, LEM: 0.2954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3290, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5769, loss: 0.9379, batch_reg_loss: 0.0894, reg_loss: 0.0888 ||:  57%|#####6    | 54/95 [00:37<00:28,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9241, LAS: 0.8602, UEM: 0.5310, LEM: 0.2909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6501, partial_loss/deprel_loss: 0.8100, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8675, loss: 0.9327, batch_reg_loss: 0.0895, reg_loss: 0.0888 ||:  60%|######    | 57/95 [00:39<00:26,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7886, UAS: 0.9236, LAS: 0.8593, UEM: 0.5250, LEM: 0.2836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6350, partial_loss/deprel_loss: 1.3677, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5108, loss: 0.9359, batch_reg_loss: 0.0896, reg_loss: 0.0889 ||:  64%|######4   | 61/95 [00:41<00:22,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8438, UAS: 0.9245, LAS: 0.8600, UEM: 0.5268, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7538, partial_loss/deprel_loss: 1.0441, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0757, loss: 0.9285, batch_reg_loss: 0.0897, reg_loss: 0.0889 ||:  68%|######8   | 65/95 [00:44<00:20,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8068, UAS: 0.9245, LAS: 0.8603, UEM: 0.5323, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4523, partial_loss/deprel_loss: 1.2092, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3476, loss: 0.9238, batch_reg_loss: 0.0897, reg_loss: 0.0890 ||:  72%|#######1  | 68/95 [00:46<00:19,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9241, LAS: 0.8601, UEM: 0.5268, LEM: 0.2820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6872, partial_loss/deprel_loss: 0.9213, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9643, loss: 0.9281, batch_reg_loss: 0.0898, reg_loss: 0.0890 ||:  75%|#######4  | 71/95 [00:49<00:17,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8261, UAS: 0.9234, LAS: 0.8594, UEM: 0.5213, LEM: 0.2761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3491, partial_loss/deprel_loss: 1.1402, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2719, loss: 0.9356, batch_reg_loss: 0.0899, reg_loss: 0.0890 ||:  79%|#######8  | 75/95 [00:51<00:13,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8833, UAS: 0.9236, LAS: 0.8595, UEM: 0.5278, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3342, partial_loss/deprel_loss: 0.6017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6382, loss: 0.9324, batch_reg_loss: 0.0900, reg_loss: 0.0891 ||:  82%|########2 | 78/95 [00:53<00:12,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7965, UAS: 0.9235, LAS: 0.8593, UEM: 0.5329, LEM: 0.2843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7970, partial_loss/deprel_loss: 1.3702, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5456, loss: 0.9340, batch_reg_loss: 0.0901, reg_loss: 0.0891 ||:  85%|########5 | 81/95 [00:55<00:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9231, LAS: 0.8588, UEM: 0.5271, LEM: 0.2793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5215, partial_loss/deprel_loss: 0.6945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7501, loss: 0.9381, batch_reg_loss: 0.0901, reg_loss: 0.0892 ||:  88%|########8 | 84/95 [00:57<00:07,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9242, LAS: 0.8600, UEM: 0.5301, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5919, partial_loss/deprel_loss: 0.7680, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8230, loss: 0.9284, batch_reg_loss: 0.0902, reg_loss: 0.0892 ||:  93%|#########2| 88/95 [01:00<00:04,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9248, LAS: 0.8606, UEM: 0.5364, LEM: 0.2827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6627, partial_loss/deprel_loss: 0.8353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8911, loss: 0.9216, batch_reg_loss: 0.0903, reg_loss: 0.0892 ||:  97%|#########6| 92/95 [01:03<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9251, LAS: 0.8608, UEM: 0.5348, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7600, partial_loss/deprel_loss: 0.8205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8988, loss: 0.9181, batch_reg_loss: 0.0904, reg_loss: 0.0893 ||: 100%|##########| 95/95 [01:04<00:00,  1.46it/s]\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.089  |       N/A\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - UEM                      |     0.535  |       N/A\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - LEM                      |     0.280  |       N/A\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - EM                       |     0.858  |       N/A\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.760  |       N/A\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:14:27,261 - INFO - combo.training.tensorboard_writer - UAS                      |     0.925  |       N/A\n",
+      "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.820  |       N/A\n",
+      "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - loss                     |     0.918  |       N/A\n",
+      "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - LAS                      |     0.861  |       N/A\n",
+      "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:14:27,262 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:14:27,263 - INFO - combo.training.trainer - Epoch duration: 0:01:04.996104\n",
+      "2023-04-06 23:14:27,263 - INFO - combo.training.trainer - Estimated training time remaining: 7:06:59\n",
+      "2023-04-06 23:14:27,263 - INFO - allennlp.training.trainer - Epoch 22/399\n",
+      "2023-04-06 23:14:27,263 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:14:27,263 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:14:27,269 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9550, LAS: 0.8944, UEM: 0.6711, LEM: 0.3244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3710, partial_loss/deprel_loss: 0.6435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6794, loss: 0.6546, batch_reg_loss: 0.0904, reg_loss: 0.0904 ||:   3%|3         | 3/95 [00:02<01:12,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9571, LAS: 0.8994, UEM: 0.7498, LEM: 0.4738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1352, partial_loss/deprel_loss: 0.2762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3385, loss: 0.5984, batch_reg_loss: 0.0905, reg_loss: 0.0904 ||:   6%|6         | 6/95 [00:04<01:10,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8508, UAS: 0.9366, LAS: 0.8751, UEM: 0.6501, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7438, partial_loss/deprel_loss: 0.9171, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9730, loss: 0.7992, batch_reg_loss: 0.0906, reg_loss: 0.0905 ||:  11%|#         | 10/95 [00:06<01:01,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9245, LAS: 0.8616, UEM: 0.5855, LEM: 0.3379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5410, partial_loss/deprel_loss: 0.6696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7345, loss: 0.9022, batch_reg_loss: 0.0906, reg_loss: 0.0905 ||:  15%|#4        | 14/95 [00:09<00:55,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9253, LAS: 0.8622, UEM: 0.5631, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3329, partial_loss/deprel_loss: 0.6379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6676, loss: 0.9063, batch_reg_loss: 0.0907, reg_loss: 0.0906 ||:  19%|#8        | 18/95 [00:11<00:51,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8312, UAS: 0.9255, LAS: 0.8618, UEM: 0.5433, LEM: 0.2871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1120, partial_loss/deprel_loss: 1.0946, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1888, loss: 0.9048, batch_reg_loss: 0.0908, reg_loss: 0.0906 ||:  22%|##2       | 21/95 [00:14<00:52,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9284, LAS: 0.8650, UEM: 0.5625, LEM: 0.2960, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3439, partial_loss/deprel_loss: 0.5512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6006, loss: 0.8739, batch_reg_loss: 0.0909, reg_loss: 0.0906 ||:  25%|##5       | 24/95 [00:16<00:52,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9261, LAS: 0.8622, UEM: 0.5615, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6291, partial_loss/deprel_loss: 0.7910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8496, loss: 0.8936, batch_reg_loss: 0.0909, reg_loss: 0.0907 ||:  28%|##8       | 27/95 [00:18<00:50,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9276, LAS: 0.8640, UEM: 0.5600, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7352, partial_loss/deprel_loss: 0.9390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9892, loss: 0.8841, batch_reg_loss: 0.0910, reg_loss: 0.0907 ||:  32%|###1      | 30/95 [00:21<00:47,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9267, LAS: 0.8631, UEM: 0.5387, LEM: 0.2710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7497, partial_loss/deprel_loss: 0.8094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8885, loss: 0.8920, batch_reg_loss: 0.0911, reg_loss: 0.0907 ||:  35%|###4      | 33/95 [00:23<00:44,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9277, LAS: 0.8640, UEM: 0.5550, LEM: 0.2830, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3010, partial_loss/deprel_loss: 0.4692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.8830, batch_reg_loss: 0.0912, reg_loss: 0.0908 ||:  39%|###8      | 37/95 [00:26<00:41,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8380, UAS: 0.9279, LAS: 0.8642, UEM: 0.5553, LEM: 0.2845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8983, partial_loss/deprel_loss: 1.0623, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1207, loss: 0.8820, batch_reg_loss: 0.0912, reg_loss: 0.0908 ||:  42%|####2     | 40/95 [00:28<00:40,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9271, LAS: 0.8628, UEM: 0.5414, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0324, partial_loss/deprel_loss: 1.0027, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0999, loss: 0.8922, batch_reg_loss: 0.0913, reg_loss: 0.0908 ||:  45%|####5     | 43/95 [00:30<00:37,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8209, UAS: 0.9257, LAS: 0.8616, UEM: 0.5265, LEM: 0.2652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1586, partial_loss/deprel_loss: 1.1841, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2703, loss: 0.9049, batch_reg_loss: 0.0914, reg_loss: 0.0909 ||:  49%|####9     | 47/95 [00:33<00:33,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8048, UAS: 0.9250, LAS: 0.8605, UEM: 0.5145, LEM: 0.2555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3112, partial_loss/deprel_loss: 1.1704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2900, loss: 0.9120, batch_reg_loss: 0.0915, reg_loss: 0.0909 ||:  54%|#####3    | 51/95 [00:35<00:30,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9254, LAS: 0.8609, UEM: 0.5121, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2439, partial_loss/deprel_loss: 0.4910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5331, loss: 0.9080, batch_reg_loss: 0.0915, reg_loss: 0.0910 ||:  58%|#####7    | 55/95 [00:38<00:26,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9269, LAS: 0.8626, UEM: 0.5298, LEM: 0.2669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 0.3964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4415, loss: 0.8933, batch_reg_loss: 0.0916, reg_loss: 0.0910 ||:  61%|######1   | 58/95 [00:40<00:25,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8567, UAS: 0.9246, LAS: 0.8602, UEM: 0.5197, LEM: 0.2607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7664, partial_loss/deprel_loss: 0.9591, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0123, loss: 0.9131, batch_reg_loss: 0.0917, reg_loss: 0.0910 ||:  65%|######5   | 62/95 [00:42<00:22,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9247, LAS: 0.8607, UEM: 0.5253, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4750, partial_loss/deprel_loss: 0.7193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7622, loss: 0.9094, batch_reg_loss: 0.0918, reg_loss: 0.0911 ||:  69%|######9   | 66/95 [00:45<00:19,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8741, UAS: 0.9260, LAS: 0.8624, UEM: 0.5400, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4970, partial_loss/deprel_loss: 0.6956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7478, loss: 0.8936, batch_reg_loss: 0.0919, reg_loss: 0.0911 ||:  74%|#######3  | 70/95 [00:48<00:18,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9253, LAS: 0.8616, UEM: 0.5566, LEM: 0.3054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0800, partial_loss/deprel_loss: 0.2153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2802, loss: 0.9009, batch_reg_loss: 0.0920, reg_loss: 0.0912 ||:  77%|#######6  | 73/95 [00:51<00:16,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8441, UAS: 0.9253, LAS: 0.8615, UEM: 0.5530, LEM: 0.3020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8445, partial_loss/deprel_loss: 1.0010, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0617, loss: 0.9044, batch_reg_loss: 0.0920, reg_loss: 0.0912 ||:  80%|########  | 76/95 [00:53<00:14,  1.34it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8696, UAS: 0.9254, LAS: 0.8613, UEM: 0.5480, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5778, partial_loss/deprel_loss: 0.8384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8784, loss: 0.9069, batch_reg_loss: 0.0921, reg_loss: 0.0912 ||:  84%|########4 | 80/95 [00:56<00:10,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8113, UAS: 0.9241, LAS: 0.8598, UEM: 0.5398, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6084, partial_loss/deprel_loss: 1.2795, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4375, loss: 0.9203, batch_reg_loss: 0.0922, reg_loss: 0.0913 ||:  87%|########7 | 83/95 [00:58<00:08,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.9246, LAS: 0.8605, UEM: 0.5373, LEM: 0.2892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8148, partial_loss/deprel_loss: 0.8937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9702, loss: 0.9162, batch_reg_loss: 0.0922, reg_loss: 0.0913 ||:  91%|######### | 86/95 [01:00<00:06,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9245, LAS: 0.8603, UEM: 0.5389, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3375, partial_loss/deprel_loss: 0.5576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6059, loss: 0.9188, batch_reg_loss: 0.0923, reg_loss: 0.0913 ||:  95%|#########4| 90/95 [01:03<00:03,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8481, UAS: 0.9248, LAS: 0.8607, UEM: 0.5360, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7173, partial_loss/deprel_loss: 0.9406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9883, loss: 0.9151, batch_reg_loss: 0.0924, reg_loss: 0.0914 ||:  99%|#########8| 94/95 [01:05<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9250, LAS: 0.8609, UEM: 0.5356, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5528, partial_loss/deprel_loss: 0.7448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7988, loss: 0.9139, batch_reg_loss: 0.0924, reg_loss: 0.0914 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.091  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - UEM                      |     0.536  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - LEM                      |     0.285  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - EM                       |     0.878  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.553  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - UAS                      |     0.925  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:15:33,694 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.745  |       N/A\n",
+      "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - loss                     |     0.914  |       N/A\n",
+      "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - LAS                      |     0.861  |       N/A\n",
+      "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:15:33,695 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:15:33,696 - INFO - combo.training.trainer - Epoch duration: 0:01:06.432977\n",
+      "2023-04-06 23:15:33,696 - INFO - combo.training.trainer - Estimated training time remaining: 7:05:29\n",
+      "2023-04-06 23:15:33,696 - INFO - allennlp.training.trainer - Epoch 23/399\n",
+      "2023-04-06 23:15:33,696 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:15:33,696 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:15:33,703 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8573, UAS: 0.9396, LAS: 0.8879, UEM: 0.7813, LEM: 0.6526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9156, partial_loss/deprel_loss: 0.9224, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0136, loss: 0.7480, batch_reg_loss: 0.0925, reg_loss: 0.0925 ||:   3%|3         | 3/95 [00:02<01:13,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8504, UAS: 0.9246, LAS: 0.8641, UEM: 0.6055, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8152, partial_loss/deprel_loss: 0.9452, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0118, loss: 0.9061, batch_reg_loss: 0.0926, reg_loss: 0.0925 ||:   7%|7         | 7/95 [00:04<01:05,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9336, LAS: 0.8745, UEM: 0.6267, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4032, partial_loss/deprel_loss: 0.6305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6777, loss: 0.8215, batch_reg_loss: 0.0927, reg_loss: 0.0926 ||:  11%|#         | 10/95 [00:07<01:02,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8429, UAS: 0.9333, LAS: 0.8736, UEM: 0.5851, LEM: 0.3732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9253, partial_loss/deprel_loss: 0.9607, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0464, loss: 0.8242, batch_reg_loss: 0.0928, reg_loss: 0.0926 ||:  15%|#4        | 14/95 [00:09<00:57,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9306, LAS: 0.8685, UEM: 0.5478, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3530, partial_loss/deprel_loss: 0.6736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7023, loss: 0.8645, batch_reg_loss: 0.0928, reg_loss: 0.0927 ||:  19%|#8        | 18/95 [00:11<00:51,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9233, LAS: 0.8608, UEM: 0.5436, LEM: 0.3292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3514, partial_loss/deprel_loss: 0.4489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5223, loss: 0.9171, batch_reg_loss: 0.0929, reg_loss: 0.0927 ||:  22%|##2       | 21/95 [00:14<00:51,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9229, LAS: 0.8595, UEM: 0.5345, LEM: 0.3218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9966, partial_loss/deprel_loss: 1.0144, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1038, loss: 0.9269, batch_reg_loss: 0.0930, reg_loss: 0.0927 ||:  26%|##6       | 25/95 [00:16<00:47,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9235, LAS: 0.8599, UEM: 0.5237, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4287, partial_loss/deprel_loss: 0.6603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7070, loss: 0.9253, batch_reg_loss: 0.0931, reg_loss: 0.0928 ||:  29%|##9       | 28/95 [00:18<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9257, LAS: 0.8626, UEM: 0.5416, LEM: 0.3125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1919, partial_loss/deprel_loss: 0.4566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4968, loss: 0.9015, batch_reg_loss: 0.0931, reg_loss: 0.0928 ||:  33%|###2      | 31/95 [00:21<00:44,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8176, UAS: 0.9265, LAS: 0.8633, UEM: 0.5546, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1036, partial_loss/deprel_loss: 1.1616, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2432, loss: 0.8961, batch_reg_loss: 0.0932, reg_loss: 0.0928 ||:  36%|###5      | 34/95 [00:23<00:44,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8807, UAS: 0.9280, LAS: 0.8649, UEM: 0.5659, LEM: 0.3310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4681, partial_loss/deprel_loss: 0.7331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7734, loss: 0.8842, batch_reg_loss: 0.0933, reg_loss: 0.0929 ||:  39%|###8      | 37/95 [00:25<00:42,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9282, LAS: 0.8651, UEM: 0.5715, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2860, partial_loss/deprel_loss: 0.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5780, loss: 0.8838, batch_reg_loss: 0.0933, reg_loss: 0.0929 ||:  42%|####2     | 40/95 [00:27<00:40,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7985, UAS: 0.9280, LAS: 0.8651, UEM: 0.5746, LEM: 0.3274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6112, partial_loss/deprel_loss: 1.2473, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4135, loss: 0.8834, batch_reg_loss: 0.0934, reg_loss: 0.0929 ||:  45%|####5     | 43/95 [00:30<00:40,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9286, LAS: 0.8656, UEM: 0.5680, LEM: 0.3191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6863, partial_loss/deprel_loss: 0.8954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9471, loss: 0.8781, batch_reg_loss: 0.0935, reg_loss: 0.0930 ||:  48%|####8     | 46/95 [00:33<00:39,  1.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8069, UAS: 0.9281, LAS: 0.8651, UEM: 0.5619, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2999, partial_loss/deprel_loss: 1.2194, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3291, loss: 0.8818, batch_reg_loss: 0.0935, reg_loss: 0.0930 ||:  52%|#####1    | 49/95 [00:35<00:35,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8021, UAS: 0.9284, LAS: 0.8654, UEM: 0.5685, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4109, partial_loss/deprel_loss: 1.2558, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3804, loss: 0.8792, batch_reg_loss: 0.0936, reg_loss: 0.0930 ||:  55%|#####4    | 52/95 [00:39<00:39,  1.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9290, LAS: 0.8665, UEM: 0.5837, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1328, partial_loss/deprel_loss: 0.2806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3447, loss: 0.8706, batch_reg_loss: 0.0937, reg_loss: 0.0931 ||:  58%|#####7    | 55/95 [00:41<00:35,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9294, LAS: 0.8665, UEM: 0.5767, LEM: 0.3271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7648, partial_loss/deprel_loss: 0.9760, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0275, loss: 0.8704, batch_reg_loss: 0.0937, reg_loss: 0.0931 ||:  61%|######1   | 58/95 [00:43<00:31,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9308, LAS: 0.8682, UEM: 0.5835, LEM: 0.3291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2990, partial_loss/deprel_loss: 0.5147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5653, loss: 0.8553, batch_reg_loss: 0.0938, reg_loss: 0.0931 ||:  64%|######4   | 61/95 [00:46<00:27,  1.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8475, UAS: 0.9294, LAS: 0.8665, UEM: 0.5760, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8493, partial_loss/deprel_loss: 0.9959, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0604, loss: 0.8729, batch_reg_loss: 0.0939, reg_loss: 0.0932 ||:  68%|######8   | 65/95 [00:48<00:23,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9290, LAS: 0.8658, UEM: 0.5684, LEM: 0.3144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4934, partial_loss/deprel_loss: 0.6541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7159, loss: 0.8777, batch_reg_loss: 0.0939, reg_loss: 0.0932 ||:  72%|#######1  | 68/95 [00:50<00:20,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9287, LAS: 0.8654, UEM: 0.5604, LEM: 0.3071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7519, partial_loss/deprel_loss: 0.8984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9631, loss: 0.8827, batch_reg_loss: 0.0940, reg_loss: 0.0932 ||:  75%|#######4  | 71/95 [00:52<00:17,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7866, UAS: 0.9278, LAS: 0.8644, UEM: 0.5533, LEM: 0.3016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6260, partial_loss/deprel_loss: 1.3245, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4789, loss: 0.8904, batch_reg_loss: 0.0941, reg_loss: 0.0933 ||:  78%|#######7  | 74/95 [00:55<00:15,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7768, UAS: 0.9264, LAS: 0.8628, UEM: 0.5454, LEM: 0.2965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9205, partial_loss/deprel_loss: 1.4197, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6140, loss: 0.9026, batch_reg_loss: 0.0941, reg_loss: 0.0933 ||:  81%|########1 | 77/95 [00:57<00:12,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8221, UAS: 0.9259, LAS: 0.8622, UEM: 0.5381, LEM: 0.2908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2362, partial_loss/deprel_loss: 1.1283, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2441, loss: 0.9077, batch_reg_loss: 0.0942, reg_loss: 0.0933 ||:  84%|########4 | 80/95 [00:59<00:10,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8262, UAS: 0.9257, LAS: 0.8619, UEM: 0.5395, LEM: 0.2932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1983, partial_loss/deprel_loss: 1.1750, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2739, loss: 0.9105, batch_reg_loss: 0.0943, reg_loss: 0.0934 ||:  87%|########7 | 83/95 [01:01<00:08,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8201, UAS: 0.9257, LAS: 0.8619, UEM: 0.5385, LEM: 0.2912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0666, partial_loss/deprel_loss: 1.1067, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1930, loss: 0.9104, batch_reg_loss: 0.0944, reg_loss: 0.0934 ||:  91%|######### | 86/95 [01:03<00:06,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9265, LAS: 0.8628, UEM: 0.5374, LEM: 0.2884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3046, partial_loss/deprel_loss: 0.5369, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5849, loss: 0.9043, batch_reg_loss: 0.0945, reg_loss: 0.0935 ||:  95%|#########4| 90/95 [01:06<00:03,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8174, UAS: 0.9268, LAS: 0.8631, UEM: 0.5373, LEM: 0.2863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2839, partial_loss/deprel_loss: 1.1413, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2644, loss: 0.9027, batch_reg_loss: 0.0946, reg_loss: 0.0935 ||:  99%|#########8| 94/95 [01:08<00:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8302, UAS: 0.9264, LAS: 0.8628, UEM: 0.5351, LEM: 0.2850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2075, partial_loss/deprel_loss: 1.1032, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2186, loss: 0.9061, batch_reg_loss: 0.0946, reg_loss: 0.0935 ||: 100%|##########| 95/95 [01:09<00:00,  1.37it/s]\n",
+      "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.094  |       N/A\n",
+      "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - UEM                      |     0.535  |       N/A\n",
+      "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - LEM                      |     0.285  |       N/A\n",
+      "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - EM                       |     0.830  |       N/A\n",
+      "2023-04-06 23:16:43,091 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.207  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - UAS                      |     0.926  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.103  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - loss                     |     0.906  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - LAS                      |     0.863  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:16:43,092 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:16:43,093 - INFO - combo.training.trainer - Epoch duration: 0:01:09.396964\n",
+      "2023-04-06 23:16:43,093 - INFO - combo.training.trainer - Estimated training time remaining: 7:04:48\n",
+      "2023-04-06 23:16:43,093 - INFO - allennlp.training.trainer - Epoch 24/399\n",
+      "2023-04-06 23:16:43,093 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:16:43,094 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:16:43,100 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9249, LAS: 0.8612, UEM: 0.3056, LEM: 0.0894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6457, partial_loss/deprel_loss: 0.7513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8249, loss: 0.9038, batch_reg_loss: 0.0947, reg_loss: 0.0946 ||:   4%|4         | 4/95 [00:02<00:56,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9331, LAS: 0.8720, UEM: 0.4283, LEM: 0.1824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2924, partial_loss/deprel_loss: 0.4524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5151, loss: 0.8246, batch_reg_loss: 0.0947, reg_loss: 0.0947 ||:   7%|7         | 7/95 [00:04<00:56,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9360, LAS: 0.8737, UEM: 0.4721, LEM: 0.2128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4536, partial_loss/deprel_loss: 0.6589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 0.8078, batch_reg_loss: 0.0948, reg_loss: 0.0947 ||:  11%|#         | 10/95 [00:07<01:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9323, LAS: 0.8695, UEM: 0.4776, LEM: 0.2093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3617, partial_loss/deprel_loss: 0.6263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6682, loss: 0.8369, batch_reg_loss: 0.0949, reg_loss: 0.0947 ||:  14%|#3        | 13/95 [00:09<00:59,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8336, UAS: 0.9316, LAS: 0.8699, UEM: 0.4900, LEM: 0.2237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2622, partial_loss/deprel_loss: 1.1134, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2381, loss: 0.8428, batch_reg_loss: 0.0949, reg_loss: 0.0948 ||:  18%|#7        | 17/95 [00:11<00:53,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9322, LAS: 0.8705, UEM: 0.5049, LEM: 0.2429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2068, partial_loss/deprel_loss: 0.4451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4924, loss: 0.8404, batch_reg_loss: 0.0950, reg_loss: 0.0948 ||:  21%|##1       | 20/95 [00:13<00:51,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9301, LAS: 0.8684, UEM: 0.4812, LEM: 0.2256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5620, partial_loss/deprel_loss: 0.7618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8170, loss: 0.8559, batch_reg_loss: 0.0951, reg_loss: 0.0948 ||:  25%|##5       | 24/95 [00:16<00:46,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9300, LAS: 0.8688, UEM: 0.5011, LEM: 0.2415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2828, partial_loss/deprel_loss: 0.4777, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5339, loss: 0.8527, batch_reg_loss: 0.0952, reg_loss: 0.0949 ||:  28%|##8       | 27/95 [00:18<00:46,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9327, LAS: 0.8717, UEM: 0.5366, LEM: 0.2690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6499, partial_loss/deprel_loss: 0.8602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9134, loss: 0.8289, batch_reg_loss: 0.0953, reg_loss: 0.0949 ||:  33%|###2      | 31/95 [00:20<00:42,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8504, UAS: 0.9316, LAS: 0.8703, UEM: 0.5202, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8491, partial_loss/deprel_loss: 0.8918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9785, loss: 0.8418, batch_reg_loss: 0.0953, reg_loss: 0.0950 ||:  36%|###5      | 34/95 [00:22<00:40,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9334, LAS: 0.8725, UEM: 0.5423, LEM: 0.2780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4035, partial_loss/deprel_loss: 0.6322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6819, loss: 0.8235, batch_reg_loss: 0.0954, reg_loss: 0.0950 ||:  39%|###8      | 37/95 [00:25<00:42,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8001, UAS: 0.9309, LAS: 0.8697, UEM: 0.5260, LEM: 0.2675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4140, partial_loss/deprel_loss: 1.2018, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3397, loss: 0.8425, batch_reg_loss: 0.0955, reg_loss: 0.0950 ||:  42%|####2     | 40/95 [00:27<00:40,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9311, LAS: 0.8699, UEM: 0.5406, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1469, partial_loss/deprel_loss: 0.3664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4180, loss: 0.8396, batch_reg_loss: 0.0955, reg_loss: 0.0951 ||:  45%|####5     | 43/95 [00:30<00:39,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9293, LAS: 0.8681, UEM: 0.5387, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2984, partial_loss/deprel_loss: 0.5597, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6031, loss: 0.8573, batch_reg_loss: 0.0956, reg_loss: 0.0951 ||:  48%|####8     | 46/95 [00:32<00:36,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9308, LAS: 0.8700, UEM: 0.5586, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4226, partial_loss/deprel_loss: 0.6094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6677, loss: 0.8396, batch_reg_loss: 0.0957, reg_loss: 0.0951 ||:  52%|#####1    | 49/95 [00:34<00:35,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9300, LAS: 0.8688, UEM: 0.5567, LEM: 0.2960, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0885, partial_loss/deprel_loss: 1.0907, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1860, loss: 0.8510, batch_reg_loss: 0.0957, reg_loss: 0.0952 ||:  56%|#####5    | 53/95 [00:37<00:29,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8210, UAS: 0.9292, LAS: 0.8678, UEM: 0.5456, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2178, partial_loss/deprel_loss: 1.1537, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2623, loss: 0.8606, batch_reg_loss: 0.0958, reg_loss: 0.0952 ||:  59%|#####8    | 56/95 [00:39<00:27,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9287, LAS: 0.8669, UEM: 0.5385, LEM: 0.2788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2499, partial_loss/deprel_loss: 1.1162, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2388, loss: 0.8674, batch_reg_loss: 0.0959, reg_loss: 0.0952 ||:  63%|######3   | 60/95 [00:41<00:23,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9286, LAS: 0.8667, UEM: 0.5355, LEM: 0.2758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2946, partial_loss/deprel_loss: 0.5109, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5636, loss: 0.8687, batch_reg_loss: 0.0960, reg_loss: 0.0953 ||:  67%|######7   | 64/95 [00:43<00:19,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8406, UAS: 0.9291, LAS: 0.8674, UEM: 0.5448, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9763, partial_loss/deprel_loss: 0.9913, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0844, loss: 0.8637, batch_reg_loss: 0.0961, reg_loss: 0.0953 ||:  72%|#######1  | 68/95 [00:46<00:17,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8227, UAS: 0.9284, LAS: 0.8665, UEM: 0.5365, LEM: 0.2817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3328, partial_loss/deprel_loss: 1.2516, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3640, loss: 0.8735, batch_reg_loss: 0.0962, reg_loss: 0.0954 ||:  76%|#######5  | 72/95 [00:48<00:14,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9294, LAS: 0.8672, UEM: 0.5403, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3011, partial_loss/deprel_loss: 0.5586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6034, loss: 0.8663, batch_reg_loss: 0.0963, reg_loss: 0.0954 ||:  81%|########1 | 77/95 [00:51<00:10,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8299, UAS: 0.9286, LAS: 0.8664, UEM: 0.5539, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1272, partial_loss/deprel_loss: 1.1322, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2275, loss: 0.8750, batch_reg_loss: 0.0964, reg_loss: 0.0955 ||:  85%|########5 | 81/95 [00:53<00:08,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7664, UAS: 0.9275, LAS: 0.8651, UEM: 0.5479, LEM: 0.2981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1046, partial_loss/deprel_loss: 1.5443, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7528, loss: 0.8858, batch_reg_loss: 0.0965, reg_loss: 0.0955 ||:  89%|########9 | 85/95 [00:56<00:06,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8017, UAS: 0.9272, LAS: 0.8646, UEM: 0.5430, LEM: 0.2943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4042, partial_loss/deprel_loss: 1.3009, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4182, loss: 0.8911, batch_reg_loss: 0.0966, reg_loss: 0.0956 ||:  94%|#########3| 89/95 [00:59<00:03,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9267, LAS: 0.8640, UEM: 0.5401, LEM: 0.2912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7409, partial_loss/deprel_loss: 0.8910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9577, loss: 0.8968, batch_reg_loss: 0.0967, reg_loss: 0.0956 ||:  98%|#########7| 93/95 [01:01<00:01,  1.56it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9270, LAS: 0.8644, UEM: 0.5390, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6818, partial_loss/deprel_loss: 0.8711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9299, loss: 0.8950, batch_reg_loss: 0.0967, reg_loss: 0.0956 ||: 100%|##########| 95/95 [01:03<00:00,  1.50it/s]\n",
+      "2023-04-06 23:17:46,366 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.096  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - UEM                      |     0.539  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - LEM                      |     0.289  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - EM                       |     0.865  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.682  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - UAS                      |     0.927  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.871  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - loss                     |     0.895  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:17:46,367 - INFO - combo.training.tensorboard_writer - LAS                      |     0.864  |       N/A\n",
+      "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:17:46,368 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:17:46,368 - INFO - combo.training.trainer - Epoch duration: 0:01:03.275262\n",
+      "2023-04-06 23:17:46,368 - INFO - combo.training.trainer - Estimated training time remaining: 7:02:32\n",
+      "2023-04-06 23:17:46,369 - INFO - allennlp.training.trainer - Epoch 25/399\n",
+      "2023-04-06 23:17:46,369 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:17:46,369 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:17:46,375 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9189, LAS: 0.8572, UEM: 0.6852, LEM: 0.5232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1098, partial_loss/deprel_loss: 0.3017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3601, loss: 0.9374, batch_reg_loss: 0.0968, reg_loss: 0.0967 ||:   3%|3         | 3/95 [00:02<01:09,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8290, UAS: 0.9208, LAS: 0.8558, UEM: 0.5725, LEM: 0.3888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1098, partial_loss/deprel_loss: 1.1618, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2482, loss: 0.9715, batch_reg_loss: 0.0969, reg_loss: 0.0968 ||:   7%|7         | 7/95 [00:04<01:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8663, UAS: 0.9256, LAS: 0.8627, UEM: 0.5164, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7495, partial_loss/deprel_loss: 0.7931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8813, loss: 0.9090, batch_reg_loss: 0.0970, reg_loss: 0.0968 ||:  12%|#1        | 11/95 [00:07<00:57,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9256, LAS: 0.8639, UEM: 0.6032, LEM: 0.4338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0652, partial_loss/deprel_loss: 0.1868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2595, loss: 0.9034, batch_reg_loss: 0.0970, reg_loss: 0.0969 ||:  15%|#4        | 14/95 [00:09<01:00,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8926, UAS: 0.9313, LAS: 0.8700, UEM: 0.6227, LEM: 0.4128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3785, partial_loss/deprel_loss: 0.5911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6457, loss: 0.8529, batch_reg_loss: 0.0971, reg_loss: 0.0969 ||:  18%|#7        | 17/95 [00:12<00:57,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9294, LAS: 0.8675, UEM: 0.5875, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4364, partial_loss/deprel_loss: 0.6350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6925, loss: 0.8762, batch_reg_loss: 0.0972, reg_loss: 0.0970 ||:  22%|##2       | 21/95 [00:14<00:53,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8775, UAS: 0.9292, LAS: 0.8669, UEM: 0.5596, LEM: 0.3443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4452, partial_loss/deprel_loss: 0.7809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8110, loss: 0.8809, batch_reg_loss: 0.0973, reg_loss: 0.0970 ||:  26%|##6       | 25/95 [00:17<00:48,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9298, LAS: 0.8674, UEM: 0.5522, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6590, partial_loss/deprel_loss: 0.8291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8925, loss: 0.8776, batch_reg_loss: 0.0974, reg_loss: 0.0970 ||:  29%|##9       | 28/95 [00:19<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8351, UAS: 0.9299, LAS: 0.8680, UEM: 0.5456, LEM: 0.3247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9874, partial_loss/deprel_loss: 1.0991, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1742, loss: 0.8726, batch_reg_loss: 0.0974, reg_loss: 0.0971 ||:  34%|###3      | 32/95 [00:21<00:42,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8864, UAS: 0.9290, LAS: 0.8669, UEM: 0.5328, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3754, partial_loss/deprel_loss: 0.6724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7105, loss: 0.8782, batch_reg_loss: 0.0975, reg_loss: 0.0971 ||:  38%|###7      | 36/95 [00:24<00:40,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8141, UAS: 0.9284, LAS: 0.8662, UEM: 0.5361, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4523, partial_loss/deprel_loss: 1.2520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3896, loss: 0.8849, batch_reg_loss: 0.0976, reg_loss: 0.0972 ||:  41%|####1     | 39/95 [00:26<00:39,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7732, UAS: 0.9246, LAS: 0.8615, UEM: 0.5251, LEM: 0.3019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9087, partial_loss/deprel_loss: 1.4498, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6392, loss: 0.9204, batch_reg_loss: 0.0977, reg_loss: 0.0972 ||:  44%|####4     | 42/95 [00:29<00:37,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8868, UAS: 0.9254, LAS: 0.8623, UEM: 0.5276, LEM: 0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4421, partial_loss/deprel_loss: 0.6628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7164, loss: 0.9134, batch_reg_loss: 0.0977, reg_loss: 0.0972 ||:  47%|####7     | 45/95 [00:31<00:37,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.9226, LAS: 0.8588, UEM: 0.5102, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8822, partial_loss/deprel_loss: 0.9684, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0490, loss: 0.9447, batch_reg_loss: 0.0978, reg_loss: 0.0973 ||:  52%|#####1    | 49/95 [00:34<00:32,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9239, LAS: 0.8604, UEM: 0.5140, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3090, partial_loss/deprel_loss: 0.4786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5426, loss: 0.9326, batch_reg_loss: 0.0979, reg_loss: 0.0973 ||:  56%|#####5    | 53/95 [00:36<00:28,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9247, LAS: 0.8612, UEM: 0.5259, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1767, partial_loss/deprel_loss: 0.3957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.9250, batch_reg_loss: 0.0980, reg_loss: 0.0974 ||:  60%|######    | 57/95 [00:39<00:25,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8981, UAS: 0.9248, LAS: 0.8615, UEM: 0.5254, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2928, partial_loss/deprel_loss: 0.5556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.9223, batch_reg_loss: 0.0981, reg_loss: 0.0974 ||:  64%|######4   | 61/95 [00:42<00:23,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7954, UAS: 0.9250, LAS: 0.8616, UEM: 0.5250, LEM: 0.2908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6197, partial_loss/deprel_loss: 1.2852, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4504, loss: 0.9219, batch_reg_loss: 0.0982, reg_loss: 0.0975 ||:  68%|######8   | 65/95 [00:44<00:20,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9256, LAS: 0.8623, UEM: 0.5224, LEM: 0.2851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2762, partial_loss/deprel_loss: 0.5328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5798, loss: 0.9149, batch_reg_loss: 0.0983, reg_loss: 0.0975 ||:  73%|#######2  | 69/95 [00:47<00:17,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9152, UAS: 0.9260, LAS: 0.8628, UEM: 0.5265, LEM: 0.2855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2881, partial_loss/deprel_loss: 0.4474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5140, loss: 0.9117, batch_reg_loss: 0.0984, reg_loss: 0.0976 ||:  77%|#######6  | 73/95 [00:49<00:14,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8064, UAS: 0.9260, LAS: 0.8628, UEM: 0.5274, LEM: 0.2852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3724, partial_loss/deprel_loss: 1.1643, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3044, loss: 0.9094, batch_reg_loss: 0.0985, reg_loss: 0.0976 ||:  81%|########1 | 77/95 [00:52<00:12,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9267, LAS: 0.8637, UEM: 0.5316, LEM: 0.2863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3660, partial_loss/deprel_loss: 0.5573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6176, loss: 0.9028, batch_reg_loss: 0.0985, reg_loss: 0.0976 ||:  84%|########4 | 80/95 [00:54<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9264, LAS: 0.8632, UEM: 0.5251, LEM: 0.2818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5652, partial_loss/deprel_loss: 0.8186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8665, loss: 0.9087, batch_reg_loss: 0.0986, reg_loss: 0.0977 ||:  87%|########7 | 83/95 [00:57<00:08,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9272, LAS: 0.8641, UEM: 0.5284, LEM: 0.2816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5205, partial_loss/deprel_loss: 0.6962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7597, loss: 0.9006, batch_reg_loss: 0.0987, reg_loss: 0.0977 ||:  91%|######### | 86/95 [00:59<00:06,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9273, LAS: 0.8641, UEM: 0.5355, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4141, partial_loss/deprel_loss: 0.6238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6806, loss: 0.8981, batch_reg_loss: 0.0987, reg_loss: 0.0977 ||:  94%|#########3| 89/95 [01:01<00:04,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9277, LAS: 0.8647, UEM: 0.5379, LEM: 0.2892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5813, partial_loss/deprel_loss: 0.7569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8206, loss: 0.8927, batch_reg_loss: 0.0988, reg_loss: 0.0978 ||:  97%|#########6| 92/95 [01:03<00:02,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9283, LAS: 0.8652, UEM: 0.5407, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5545, partial_loss/deprel_loss: 0.7295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7933, loss: 0.8872, batch_reg_loss: 0.0988, reg_loss: 0.0978 ||: 100%|##########| 95/95 [01:06<00:00,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9283, LAS: 0.8652, UEM: 0.5407, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5545, partial_loss/deprel_loss: 0.7295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7933, loss: 0.8872, batch_reg_loss: 0.0988, reg_loss: 0.0978 ||: 100%|##########| 95/95 [01:06<00:00,  1.44it/s]\n",
+      "2023-04-06 23:18:52,458 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9213, LAS: 0.8628, UEM: 0.3785, LEM: 0.1168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4790, partial_loss/deprel_loss: 23.3874, partial_loss/cycle_loss: 0.0000, batch_loss: 18.8057, loss: 31.9415, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.07s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8605, UAS: 0.9251, LAS: 0.8630, UEM: 0.3372, LEM: 0.1015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8384, partial_loss/deprel_loss: 42.7479, partial_loss/cycle_loss: 0.0000, batch_loss: 34.3660, loss: 31.7453, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:06,  1.03s/it]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9405, LAS: 0.8815, UEM: 0.5725, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4084, partial_loss/deprel_loss: 28.1948, partial_loss/cycle_loss: 0.0000, batch_loss: 22.6376, loss: 27.6476, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:07<00:02,  1.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9460, LAS: 0.8885, UEM: 0.6523, LEM: 0.3801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7674, partial_loss/deprel_loss: 32.9125, partial_loss/cycle_loss: 0.0000, batch_loss: 26.4835, loss: 25.6424, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9460, LAS: 0.8885, UEM: 0.6523, LEM: 0.3801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7674, partial_loss/deprel_loss: 32.9125, partial_loss/cycle_loss: 0.0000, batch_loss: 26.4835, loss: 25.6424, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.04it/s]\n",
+      "2023-04-06 23:19:03,065 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.098  |     0.000\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - UEM                      |     0.541  |     0.652\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - LEM                      |     0.290  |     0.380\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - EM                       |     0.876  |     0.873\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.555  |     0.767\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - UAS                      |     0.928  |     0.946\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.729  |    32.913\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - loss                     |     0.887  |    25.642\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - LAS                      |     0.865  |     0.888\n",
+      "2023-04-06 23:19:03,066 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:19:03,067 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:19:03,067 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:19:03,067 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:19:03,067 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:19:03,067 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:19:03,067 - INFO - combo.training.trainer - Epoch duration: 0:01:16.698692\n",
+      "2023-04-06 23:19:03,067 - INFO - combo.training.trainer - Estimated training time remaining: 7:03:35\n",
+      "2023-04-06 23:19:03,067 - INFO - allennlp.training.trainer - Epoch 26/399\n",
+      "2023-04-06 23:19:03,068 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:19:03,068 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:19:03,074 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8072, UAS: 0.9113, LAS: 0.8445, UEM: 0.2432, LEM: 0.0822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4756, partial_loss/deprel_loss: 1.1600, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3220, loss: 1.0506, batch_reg_loss: 0.0989, reg_loss: 0.0989 ||:   3%|3         | 3/95 [00:02<01:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9313, LAS: 0.8702, UEM: 0.6215, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2637, partial_loss/deprel_loss: 0.5345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5793, loss: 0.8482, batch_reg_loss: 0.0990, reg_loss: 0.0989 ||:   6%|6         | 6/95 [00:04<01:01,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8316, UAS: 0.9333, LAS: 0.8707, UEM: 0.5914, LEM: 0.3525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0801, partial_loss/deprel_loss: 1.0039, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1181, loss: 0.8360, batch_reg_loss: 0.0990, reg_loss: 0.0989 ||:   9%|9         | 9/95 [00:06<00:59,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8532, UAS: 0.9310, LAS: 0.8692, UEM: 0.5342, LEM: 0.2943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9169, partial_loss/deprel_loss: 0.8493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9619, loss: 0.8448, batch_reg_loss: 0.0991, reg_loss: 0.0990 ||:  14%|#3        | 13/95 [00:08<00:54,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9347, LAS: 0.8743, UEM: 0.6199, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0694, partial_loss/deprel_loss: 0.1922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2668, loss: 0.8110, batch_reg_loss: 0.0991, reg_loss: 0.0990 ||:  17%|#6        | 16/95 [00:11<00:56,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9389, LAS: 0.8791, UEM: 0.6526, LEM: 0.4167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1531, partial_loss/deprel_loss: 0.3584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4165, loss: 0.7715, batch_reg_loss: 0.0992, reg_loss: 0.0990 ||:  20%|##        | 19/95 [00:13<00:57,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8427, UAS: 0.9359, LAS: 0.8755, UEM: 0.6283, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0335, partial_loss/deprel_loss: 0.9413, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0590, loss: 0.8061, batch_reg_loss: 0.0993, reg_loss: 0.0991 ||:  23%|##3       | 22/95 [00:15<00:55,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9358, LAS: 0.8751, UEM: 0.6096, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2864, partial_loss/deprel_loss: 0.5830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6230, loss: 0.8102, batch_reg_loss: 0.0993, reg_loss: 0.0991 ||:  27%|##7       | 26/95 [00:18<00:49,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8783, UAS: 0.9367, LAS: 0.8759, UEM: 0.5972, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4592, partial_loss/deprel_loss: 0.6983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7499, loss: 0.8017, batch_reg_loss: 0.0994, reg_loss: 0.0991 ||:  32%|###1      | 30/95 [00:20<00:43,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7727, UAS: 0.9329, LAS: 0.8714, UEM: 0.5814, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0666, partial_loss/deprel_loss: 1.4850, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7008, loss: 0.8388, batch_reg_loss: 0.0995, reg_loss: 0.0992 ||:  35%|###4      | 33/95 [00:22<00:42,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9321, LAS: 0.8707, UEM: 0.5792, LEM: 0.3314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5242, partial_loss/deprel_loss: 0.6863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7535, loss: 0.8426, batch_reg_loss: 0.0996, reg_loss: 0.0992 ||:  38%|###7      | 36/95 [00:25<00:41,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9335, LAS: 0.8721, UEM: 0.5865, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1567, partial_loss/deprel_loss: 0.4337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4779, loss: 0.8318, batch_reg_loss: 0.0996, reg_loss: 0.0992 ||:  41%|####1     | 39/95 [00:27<00:38,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8556, UAS: 0.9334, LAS: 0.8717, UEM: 0.5767, LEM: 0.3236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7608, partial_loss/deprel_loss: 0.8941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9672, loss: 0.8360, batch_reg_loss: 0.0997, reg_loss: 0.0993 ||:  44%|####4     | 42/95 [00:29<00:37,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8195, UAS: 0.9308, LAS: 0.8689, UEM: 0.5553, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2714, partial_loss/deprel_loss: 1.1683, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2887, loss: 0.8602, batch_reg_loss: 0.0998, reg_loss: 0.0993 ||:  48%|####8     | 46/95 [00:31<00:32,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9302, LAS: 0.8681, UEM: 0.5470, LEM: 0.3021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6266, partial_loss/deprel_loss: 0.9013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9463, loss: 0.8662, batch_reg_loss: 0.0999, reg_loss: 0.0993 ||:  53%|#####2    | 50/95 [00:34<00:29,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9290, LAS: 0.8667, UEM: 0.5389, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3298, partial_loss/deprel_loss: 0.5372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5956, loss: 0.8754, batch_reg_loss: 0.1000, reg_loss: 0.0994 ||:  57%|#####6    | 54/95 [00:37<00:27,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9298, LAS: 0.8677, UEM: 0.5382, LEM: 0.2922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4384, partial_loss/deprel_loss: 0.6646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7194, loss: 0.8674, batch_reg_loss: 0.1000, reg_loss: 0.0994 ||:  60%|######    | 57/95 [00:39<00:26,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9305, LAS: 0.8687, UEM: 0.5427, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5983, partial_loss/deprel_loss: 0.7491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8190, loss: 0.8575, batch_reg_loss: 0.1001, reg_loss: 0.0995 ||:  63%|######3   | 60/95 [00:41<00:24,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9068, UAS: 0.9314, LAS: 0.8696, UEM: 0.5507, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3255, partial_loss/deprel_loss: 0.5318, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5907, loss: 0.8503, batch_reg_loss: 0.1002, reg_loss: 0.0995 ||:  66%|######6   | 63/95 [00:43<00:22,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9325, LAS: 0.8710, UEM: 0.5650, LEM: 0.3113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2447, partial_loss/deprel_loss: 0.4833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5358, loss: 0.8399, batch_reg_loss: 0.1002, reg_loss: 0.0995 ||:  69%|######9   | 66/95 [00:45<00:20,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9321, LAS: 0.8707, UEM: 0.5562, LEM: 0.3035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5490, partial_loss/deprel_loss: 0.6523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7320, loss: 0.8437, batch_reg_loss: 0.1003, reg_loss: 0.0996 ||:  74%|#######3  | 70/95 [00:48<00:16,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9299, LAS: 0.8679, UEM: 0.5506, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0729, partial_loss/deprel_loss: 1.0520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1566, loss: 0.8650, batch_reg_loss: 0.1004, reg_loss: 0.0996 ||:  78%|#######7  | 74/95 [00:51<00:14,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9310, LAS: 0.8692, UEM: 0.5607, LEM: 0.3054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2774, partial_loss/deprel_loss: 0.5219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5735, loss: 0.8541, batch_reg_loss: 0.1005, reg_loss: 0.0996 ||:  81%|########1 | 77/95 [00:53<00:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9311, LAS: 0.8690, UEM: 0.5606, LEM: 0.3044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3240, partial_loss/deprel_loss: 0.5033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5680, loss: 0.8555, batch_reg_loss: 0.1006, reg_loss: 0.0997 ||:  85%|########5 | 81/95 [00:55<00:09,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7720, UAS: 0.9296, LAS: 0.8672, UEM: 0.5546, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9315, partial_loss/deprel_loss: 1.4020, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6085, loss: 0.8708, batch_reg_loss: 0.1006, reg_loss: 0.0997 ||:  89%|########9 | 85/95 [00:58<00:06,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9295, LAS: 0.8671, UEM: 0.5508, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.5579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6049, loss: 0.8730, batch_reg_loss: 0.1007, reg_loss: 0.0998 ||:  94%|#########3| 89/95 [01:00<00:03,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8302, UAS: 0.9282, LAS: 0.8654, UEM: 0.5411, LEM: 0.2887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2976, partial_loss/deprel_loss: 1.0998, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2402, loss: 0.8888, batch_reg_loss: 0.1008, reg_loss: 0.0998 ||:  98%|#########7| 93/95 [01:03<00:01,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8521, UAS: 0.9284, LAS: 0.8657, UEM: 0.5413, LEM: 0.2883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7940, partial_loss/deprel_loss: 0.9193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9951, loss: 0.8863, batch_reg_loss: 0.1009, reg_loss: 0.0998 ||: 100%|##########| 95/95 [01:04<00:00,  1.47it/s]\n",
+      "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.100  |       N/A\n",
+      "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - UEM                      |     0.541  |       N/A\n",
+      "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - LEM                      |     0.288  |       N/A\n",
+      "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - EM                       |     0.852  |       N/A\n",
+      "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.794  |       N/A\n",
+      "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,747 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - UAS                      |     0.928  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.919  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - loss                     |     0.886  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - LAS                      |     0.866  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,748 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,749 - INFO - combo.training.trainer - Epoch duration: 0:01:04.681370\n",
+      "2023-04-06 23:20:07,749 - INFO - combo.training.trainer - Estimated training time remaining: 7:01:42\n",
+      "2023-04-06 23:20:07,749 - INFO - allennlp.training.trainer - Epoch 27/399\n",
+      "2023-04-06 23:20:07,749 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:20:07,750 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:20:07,756 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8349, UAS: 0.9402, LAS: 0.8809, UEM: 0.6214, LEM: 0.3571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0407, partial_loss/deprel_loss: 0.9975, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1071, loss: 0.7497, batch_reg_loss: 0.1009, reg_loss: 0.1009 ||:   3%|3         | 3/95 [00:02<01:07,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9328, LAS: 0.8730, UEM: 0.5754, LEM: 0.3017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4208, partial_loss/deprel_loss: 0.5776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6473, loss: 0.8459, batch_reg_loss: 0.1010, reg_loss: 0.1010 ||:   7%|7         | 7/95 [00:04<01:01,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8304, UAS: 0.9262, LAS: 0.8658, UEM: 0.5596, LEM: 0.3057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2200, partial_loss/deprel_loss: 1.0964, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2222, loss: 0.9046, batch_reg_loss: 0.1011, reg_loss: 0.1010 ||:  12%|#1        | 11/95 [00:07<00:56,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9303, LAS: 0.8699, UEM: 0.5420, LEM: 0.2755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2592, partial_loss/deprel_loss: 0.5424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5870, loss: 0.8664, batch_reg_loss: 0.1012, reg_loss: 0.1011 ||:  16%|#5        | 15/95 [00:09<00:52,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9321, LAS: 0.8715, UEM: 0.5462, LEM: 0.2800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.5019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.8517, batch_reg_loss: 0.1013, reg_loss: 0.1011 ||:  19%|#8        | 18/95 [00:11<00:51,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8288, UAS: 0.9278, LAS: 0.8668, UEM: 0.5127, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2996, partial_loss/deprel_loss: 1.0387, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1922, loss: 0.8887, batch_reg_loss: 0.1014, reg_loss: 0.1011 ||:  22%|##2       | 21/95 [00:13<00:50,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7923, UAS: 0.9247, LAS: 0.8633, UEM: 0.5101, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7245, partial_loss/deprel_loss: 1.2478, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4445, loss: 0.9164, batch_reg_loss: 0.1014, reg_loss: 0.1012 ||:  25%|##5       | 24/95 [00:15<00:48,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9267, LAS: 0.8652, UEM: 0.5210, LEM: 0.2605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8427, partial_loss/deprel_loss: 0.8735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9689, loss: 0.8957, batch_reg_loss: 0.1015, reg_loss: 0.1012 ||:  28%|##8       | 27/95 [00:18<00:49,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9258, LAS: 0.8646, UEM: 0.5120, LEM: 0.2556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2659, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5554, loss: 0.8987, batch_reg_loss: 0.1016, reg_loss: 0.1012 ||:  33%|###2      | 31/95 [00:20<00:44,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9272, LAS: 0.8661, UEM: 0.5207, LEM: 0.2645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7525, partial_loss/deprel_loss: 0.9462, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0091, loss: 0.8831, batch_reg_loss: 0.1016, reg_loss: 0.1013 ||:  36%|###5      | 34/95 [00:23<00:44,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9275, LAS: 0.8662, UEM: 0.5229, LEM: 0.2687, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2010, partial_loss/deprel_loss: 0.4556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5064, loss: 0.8833, batch_reg_loss: 0.1017, reg_loss: 0.1013 ||:  40%|####      | 38/95 [00:25<00:40,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9298, LAS: 0.8686, UEM: 0.5593, LEM: 0.3146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0536, partial_loss/deprel_loss: 0.2114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2817, loss: 0.8655, batch_reg_loss: 0.1018, reg_loss: 0.1014 ||:  44%|####4     | 42/95 [00:28<00:38,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9312, LAS: 0.8703, UEM: 0.5728, LEM: 0.3241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6638, partial_loss/deprel_loss: 0.8781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9371, loss: 0.8541, batch_reg_loss: 0.1019, reg_loss: 0.1014 ||:  47%|####7     | 45/95 [00:30<00:35,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9325, LAS: 0.8718, UEM: 0.5748, LEM: 0.3211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3237, partial_loss/deprel_loss: 0.5522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6084, loss: 0.8425, batch_reg_loss: 0.1020, reg_loss: 0.1014 ||:  52%|#####1    | 49/95 [00:33<00:32,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9324, LAS: 0.8714, UEM: 0.5740, LEM: 0.3170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2472, partial_loss/deprel_loss: 0.4914, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5446, loss: 0.8439, batch_reg_loss: 0.1020, reg_loss: 0.1015 ||:  56%|#####5    | 53/95 [00:36<00:29,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8713, UAS: 0.9321, LAS: 0.8710, UEM: 0.5646, LEM: 0.3081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6406, partial_loss/deprel_loss: 0.6568, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7557, loss: 0.8434, batch_reg_loss: 0.1021, reg_loss: 0.1015 ||:  59%|#####8    | 56/95 [00:38<00:26,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9334, LAS: 0.8726, UEM: 0.5752, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1631, partial_loss/deprel_loss: 0.3817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4401, loss: 0.8327, batch_reg_loss: 0.1022, reg_loss: 0.1015 ||:  62%|######2   | 59/95 [00:40<00:25,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8279, UAS: 0.9339, LAS: 0.8731, UEM: 0.5878, LEM: 0.3324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3192, partial_loss/deprel_loss: 1.2217, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3434, loss: 0.8309, batch_reg_loss: 0.1022, reg_loss: 0.1016 ||:  65%|######5   | 62/95 [00:43<00:24,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9332, LAS: 0.8723, UEM: 0.5816, LEM: 0.3252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4838, partial_loss/deprel_loss: 0.6110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.8382, batch_reg_loss: 0.1023, reg_loss: 0.1016 ||:  69%|######9   | 66/95 [00:45<00:20,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9321, LAS: 0.8710, UEM: 0.5712, LEM: 0.3175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0679, partial_loss/deprel_loss: 1.0180, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1303, loss: 0.8474, batch_reg_loss: 0.1023, reg_loss: 0.1016 ||:  73%|#######2  | 69/95 [00:47<00:18,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9304, LAS: 0.8692, UEM: 0.5678, LEM: 0.3159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8930, partial_loss/deprel_loss: 0.9460, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0378, loss: 0.8628, batch_reg_loss: 0.1024, reg_loss: 0.1017 ||:  76%|#######5  | 72/95 [00:49<00:15,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.9309, LAS: 0.8698, UEM: 0.5655, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4401, partial_loss/deprel_loss: 0.6275, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6925, loss: 0.8581, batch_reg_loss: 0.1025, reg_loss: 0.1017 ||:  80%|########  | 76/95 [00:52<00:13,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8117, UAS: 0.9301, LAS: 0.8687, UEM: 0.5591, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2777, partial_loss/deprel_loss: 1.1437, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2731, loss: 0.8666, batch_reg_loss: 0.1026, reg_loss: 0.1017 ||:  83%|########3 | 79/95 [00:54<00:11,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8390, UAS: 0.9290, LAS: 0.8676, UEM: 0.5500, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0951, partial_loss/deprel_loss: 0.9973, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1195, loss: 0.8737, batch_reg_loss: 0.1027, reg_loss: 0.1018 ||:  87%|########7 | 83/95 [00:57<00:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7900, UAS: 0.9282, LAS: 0.8667, UEM: 0.5473, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7822, partial_loss/deprel_loss: 1.2444, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4547, loss: 0.8816, batch_reg_loss: 0.1027, reg_loss: 0.1018 ||:  91%|######### | 86/95 [00:59<00:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8335, UAS: 0.9280, LAS: 0.8663, UEM: 0.5431, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9607, partial_loss/deprel_loss: 1.1209, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1917, loss: 0.8857, batch_reg_loss: 0.1028, reg_loss: 0.1019 ||:  94%|#########3| 89/95 [01:01<00:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9287, LAS: 0.8672, UEM: 0.5497, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2051, partial_loss/deprel_loss: 0.4471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5016, loss: 0.8794, batch_reg_loss: 0.1029, reg_loss: 0.1019 ||:  97%|#########6| 92/95 [01:03<00:02,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9292, LAS: 0.8676, UEM: 0.5475, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6508, partial_loss/deprel_loss: 0.8607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9217, loss: 0.8774, batch_reg_loss: 0.1030, reg_loss: 0.1019 ||: 100%|##########| 95/95 [01:06<00:00,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9292, LAS: 0.8676, UEM: 0.5475, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6508, partial_loss/deprel_loss: 0.8607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9217, loss: 0.8774, batch_reg_loss: 0.1030, reg_loss: 0.1019 ||: 100%|##########| 95/95 [01:06<00:00,  1.44it/s]\n",
+      "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.102  |       N/A\n",
+      "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - UEM                      |     0.547  |       N/A\n",
+      "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - LEM                      |     0.295  |       N/A\n",
+      "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - EM                       |     0.869  |       N/A\n",
+      "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.651  |       N/A\n",
+      "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:21:13,788 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.861  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - loss                     |     0.877  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - LAS                      |     0.868  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:21:13,789 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:21:13,790 - INFO - combo.training.trainer - Epoch duration: 0:01:06.040844\n",
+      "2023-04-06 23:21:13,790 - INFO - combo.training.trainer - Estimated training time remaining: 7:00:10\n",
+      "2023-04-06 23:21:13,790 - INFO - allennlp.training.trainer - Epoch 28/399\n",
+      "2023-04-06 23:21:13,790 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:21:13,791 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:21:13,797 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9346, LAS: 0.8735, UEM: 0.6326, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2719, partial_loss/deprel_loss: 0.4796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5411, loss: 0.8077, batch_reg_loss: 0.1030, reg_loss: 0.1030 ||:   3%|3         | 3/95 [00:02<01:08,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9287, LAS: 0.8674, UEM: 0.5346, LEM: 0.2683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6960, partial_loss/deprel_loss: 0.7365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8315, loss: 0.8417, batch_reg_loss: 0.1031, reg_loss: 0.1030 ||:   6%|6         | 6/95 [00:04<01:06,  1.34it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9345, LAS: 0.8759, UEM: 0.5972, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2194, partial_loss/deprel_loss: 0.4033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4697, loss: 0.7925, batch_reg_loss: 0.1032, reg_loss: 0.1031 ||:   9%|9         | 9/95 [00:06<01:03,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9365, LAS: 0.8772, UEM: 0.5851, LEM: 0.3187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8063, partial_loss/deprel_loss: 0.9712, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0415, loss: 0.7803, batch_reg_loss: 0.1033, reg_loss: 0.1031 ||:  13%|#2        | 12/95 [00:08<01:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8620, UAS: 0.9352, LAS: 0.8757, UEM: 0.5425, LEM: 0.2885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7990, partial_loss/deprel_loss: 0.8716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9604, loss: 0.8003, batch_reg_loss: 0.1033, reg_loss: 0.1032 ||:  17%|#6        | 16/95 [00:11<00:53,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9375, LAS: 0.8778, UEM: 0.5466, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3478, partial_loss/deprel_loss: 0.6074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6589, loss: 0.7860, batch_reg_loss: 0.1034, reg_loss: 0.1032 ||:  21%|##1       | 20/95 [00:13<00:50,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9379, LAS: 0.8783, UEM: 0.5463, LEM: 0.2834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5882, partial_loss/deprel_loss: 0.7416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8144, loss: 0.7834, batch_reg_loss: 0.1035, reg_loss: 0.1032 ||:  24%|##4       | 23/95 [00:15<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8387, UAS: 0.9334, LAS: 0.8734, UEM: 0.5331, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1025, partial_loss/deprel_loss: 1.0446, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1597, loss: 0.8237, batch_reg_loss: 0.1036, reg_loss: 0.1033 ||:  27%|##7       | 26/95 [00:18<00:48,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9375, LAS: 0.8775, UEM: 0.5796, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1351, partial_loss/deprel_loss: 0.3968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4481, loss: 0.7905, batch_reg_loss: 0.1036, reg_loss: 0.1033 ||:  32%|###1      | 30/95 [00:20<00:45,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9390, LAS: 0.8796, UEM: 0.5881, LEM: 0.3117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3049, partial_loss/deprel_loss: 0.5112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5736, loss: 0.7753, batch_reg_loss: 0.1037, reg_loss: 0.1034 ||:  36%|###5      | 34/95 [00:23<00:42,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9383, LAS: 0.8791, UEM: 0.5771, LEM: 0.3039, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4137, partial_loss/deprel_loss: 0.5516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6278, loss: 0.7768, batch_reg_loss: 0.1038, reg_loss: 0.1034 ||:  39%|###8      | 37/95 [00:25<00:40,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9340, LAS: 0.8743, UEM: 0.5647, LEM: 0.2956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5219, partial_loss/deprel_loss: 0.6677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7423, loss: 0.8181, batch_reg_loss: 0.1038, reg_loss: 0.1034 ||:  42%|####2     | 40/95 [00:27<00:39,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9351, LAS: 0.8755, UEM: 0.5681, LEM: 0.2962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3436, partial_loss/deprel_loss: 0.5420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6062, loss: 0.8089, batch_reg_loss: 0.1039, reg_loss: 0.1035 ||:  45%|####5     | 43/95 [00:30<00:38,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8868, UAS: 0.9339, LAS: 0.8741, UEM: 0.5594, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3736, partial_loss/deprel_loss: 0.6634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7094, loss: 0.8196, batch_reg_loss: 0.1040, reg_loss: 0.1035 ||:  49%|####9     | 47/95 [00:32<00:33,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9337, LAS: 0.8738, UEM: 0.5603, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2939, partial_loss/deprel_loss: 0.5093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5702, loss: 0.8231, batch_reg_loss: 0.1040, reg_loss: 0.1035 ||:  53%|#####2    | 50/95 [00:34<00:32,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8383, UAS: 0.9327, LAS: 0.8726, UEM: 0.5652, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9954, partial_loss/deprel_loss: 1.1214, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2003, loss: 0.8335, batch_reg_loss: 0.1041, reg_loss: 0.1036 ||:  56%|#####5    | 53/95 [00:37<00:29,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9328, LAS: 0.8727, UEM: 0.5670, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1960, partial_loss/deprel_loss: 0.4040, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4666, loss: 0.8345, batch_reg_loss: 0.1042, reg_loss: 0.1036 ||:  59%|#####8    | 56/95 [00:39<00:27,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8573, UAS: 0.9334, LAS: 0.8734, UEM: 0.5847, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7031, partial_loss/deprel_loss: 0.9869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0344, loss: 0.8302, batch_reg_loss: 0.1042, reg_loss: 0.1036 ||:  62%|######2   | 59/95 [00:41<00:25,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9340, LAS: 0.8741, UEM: 0.5861, LEM: 0.3268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2656, partial_loss/deprel_loss: 0.4323, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5032, loss: 0.8227, batch_reg_loss: 0.1043, reg_loss: 0.1037 ||:  65%|######5   | 62/95 [00:43<00:23,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9343, LAS: 0.8742, UEM: 0.5832, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2923, partial_loss/deprel_loss: 0.5219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5804, loss: 0.8244, batch_reg_loss: 0.1044, reg_loss: 0.1037 ||:  69%|######9   | 66/95 [00:45<00:19,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8361, UAS: 0.9334, LAS: 0.8731, UEM: 0.5736, LEM: 0.3156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0562, partial_loss/deprel_loss: 1.0607, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1642, loss: 0.8343, batch_reg_loss: 0.1045, reg_loss: 0.1037 ||:  73%|#######2  | 69/95 [00:48<00:17,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9317, LAS: 0.8714, UEM: 0.5647, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4167, partial_loss/deprel_loss: 0.6013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6689, loss: 0.8474, batch_reg_loss: 0.1046, reg_loss: 0.1038 ||:  77%|#######6  | 73/95 [00:50<00:14,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8362, UAS: 0.9317, LAS: 0.8713, UEM: 0.5695, LEM: 0.3180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0380, partial_loss/deprel_loss: 1.0594, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1598, loss: 0.8477, batch_reg_loss: 0.1046, reg_loss: 0.1038 ||:  81%|########1 | 77/95 [00:53<00:11,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9315, LAS: 0.8710, UEM: 0.5662, LEM: 0.3139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6735, partial_loss/deprel_loss: 0.7805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8638, loss: 0.8493, batch_reg_loss: 0.1047, reg_loss: 0.1039 ||:  85%|########5 | 81/95 [00:55<00:09,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9312, LAS: 0.8707, UEM: 0.5638, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6924, partial_loss/deprel_loss: 0.8298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9072, loss: 0.8523, batch_reg_loss: 0.1048, reg_loss: 0.1039 ||:  89%|########9 | 85/95 [00:58<00:06,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9315, LAS: 0.8709, UEM: 0.5598, LEM: 0.3092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3775, partial_loss/deprel_loss: 0.6310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6852, loss: 0.8520, batch_reg_loss: 0.1049, reg_loss: 0.1039 ||:  93%|#########2| 88/95 [01:00<00:04,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9302, LAS: 0.8695, UEM: 0.5517, LEM: 0.3027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0410, partial_loss/deprel_loss: 0.9326, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0593, loss: 0.8626, batch_reg_loss: 0.1050, reg_loss: 0.1040 ||:  97%|#########6| 92/95 [01:03<00:02,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9294, LAS: 0.8688, UEM: 0.5463, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7954, partial_loss/deprel_loss: 0.8031, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9066, loss: 0.8690, batch_reg_loss: 0.1050, reg_loss: 0.1040 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n",
+      "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.104  |       N/A\n",
+      "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - UEM                      |     0.546  |       N/A\n",
+      "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - LEM                      |     0.299  |       N/A\n",
+      "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - EM                       |     0.861  |       N/A\n",
+      "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.795  |       N/A\n",
+      "2023-04-06 23:22:18,868 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.803  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - loss                     |     0.869  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - LAS                      |     0.869  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:22:18,869 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:22:18,870 - INFO - combo.training.trainer - Epoch duration: 0:01:05.079751\n",
+      "2023-04-06 23:22:18,870 - INFO - combo.training.trainer - Estimated training time remaining: 6:58:28\n",
+      "2023-04-06 23:22:18,870 - INFO - allennlp.training.trainer - Epoch 29/399\n",
+      "2023-04-06 23:22:18,870 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:22:18,871 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:22:18,878 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9405, LAS: 0.8823, UEM: 0.5759, LEM: 0.3195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5825, partial_loss/deprel_loss: 0.8253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8819, loss: 0.7942, batch_reg_loss: 0.1051, reg_loss: 0.1051 ||:   4%|4         | 4/95 [00:02<00:55,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8507, UAS: 0.9405, LAS: 0.8816, UEM: 0.5821, LEM: 0.3110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9805, partial_loss/deprel_loss: 0.9054, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0257, loss: 0.7758, batch_reg_loss: 0.1052, reg_loss: 0.1051 ||:   7%|7         | 7/95 [00:04<00:58,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9302, LAS: 0.8717, UEM: 0.5302, LEM: 0.2747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4166, partial_loss/deprel_loss: 0.5184, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6033, loss: 0.8529, batch_reg_loss: 0.1053, reg_loss: 0.1052 ||:  12%|#1        | 11/95 [00:07<00:54,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9260, LAS: 0.8661, UEM: 0.5289, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3419, partial_loss/deprel_loss: 0.5726, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6318, loss: 0.8873, batch_reg_loss: 0.1053, reg_loss: 0.1052 ||:  15%|#4        | 14/95 [00:09<00:55,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9275, LAS: 0.8671, UEM: 0.5159, LEM: 0.2500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0340, partial_loss/deprel_loss: 0.9651, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0843, loss: 0.8791, batch_reg_loss: 0.1054, reg_loss: 0.1053 ||:  19%|#8        | 18/95 [00:12<00:51,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9315, LAS: 0.8715, UEM: 0.5550, LEM: 0.2817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2981, partial_loss/deprel_loss: 0.4884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5558, loss: 0.8402, batch_reg_loss: 0.1055, reg_loss: 0.1053 ||:  22%|##2       | 21/95 [00:14<00:50,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9280, LAS: 0.8674, UEM: 0.5284, LEM: 0.2651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6160, partial_loss/deprel_loss: 0.7219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8063, loss: 0.8731, batch_reg_loss: 0.1056, reg_loss: 0.1053 ||:  25%|##5       | 24/95 [00:16<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9277, LAS: 0.8663, UEM: 0.4999, LEM: 0.2436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5052, partial_loss/deprel_loss: 0.7323, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7925, loss: 0.8844, batch_reg_loss: 0.1057, reg_loss: 0.1054 ||:  29%|##9       | 28/95 [00:18<00:44,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9291, LAS: 0.8684, UEM: 0.5310, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5477, partial_loss/deprel_loss: 0.7332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8018, loss: 0.8681, batch_reg_loss: 0.1057, reg_loss: 0.1054 ||:  33%|###2      | 31/95 [00:20<00:43,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8494, UAS: 0.9309, LAS: 0.8711, UEM: 0.5795, LEM: 0.3469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0689, partial_loss/deprel_loss: 0.9747, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0993, loss: 0.8510, batch_reg_loss: 0.1058, reg_loss: 0.1054 ||:  36%|###5      | 34/95 [00:23<00:45,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.9288, LAS: 0.8687, UEM: 0.5669, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9300, partial_loss/deprel_loss: 0.9667, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0652, loss: 0.8740, batch_reg_loss: 0.1059, reg_loss: 0.1055 ||:  39%|###8      | 37/95 [00:25<00:41,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9303, LAS: 0.8708, UEM: 0.5728, LEM: 0.3387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2012, partial_loss/deprel_loss: 0.4225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4842, loss: 0.8581, batch_reg_loss: 0.1059, reg_loss: 0.1055 ||:  42%|####2     | 40/95 [00:27<00:39,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9324, LAS: 0.8733, UEM: 0.5812, LEM: 0.3390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3429, partial_loss/deprel_loss: 0.5983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6532, loss: 0.8376, batch_reg_loss: 0.1060, reg_loss: 0.1055 ||:  46%|####6     | 44/95 [00:30<00:35,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9312, LAS: 0.8722, UEM: 0.5699, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4785, partial_loss/deprel_loss: 0.6576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7279, loss: 0.8446, batch_reg_loss: 0.1061, reg_loss: 0.1056 ||:  51%|#####     | 48/95 [00:33<00:33,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9314, LAS: 0.8722, UEM: 0.5611, LEM: 0.3180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5880, partial_loss/deprel_loss: 0.7489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8229, loss: 0.8442, batch_reg_loss: 0.1062, reg_loss: 0.1056 ||:  54%|#####3    | 51/95 [00:35<00:31,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8172, UAS: 0.9304, LAS: 0.8710, UEM: 0.5544, LEM: 0.3118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3823, partial_loss/deprel_loss: 1.1230, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2811, loss: 0.8544, batch_reg_loss: 0.1062, reg_loss: 0.1056 ||:  57%|#####6    | 54/95 [00:37<00:29,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9306, LAS: 0.8711, UEM: 0.5548, LEM: 0.3100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2805, partial_loss/deprel_loss: 0.5140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5736, loss: 0.8514, batch_reg_loss: 0.1063, reg_loss: 0.1057 ||:  60%|######    | 57/95 [00:39<00:27,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9310, LAS: 0.8713, UEM: 0.5602, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3802, partial_loss/deprel_loss: 0.6500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7024, loss: 0.8500, batch_reg_loss: 0.1063, reg_loss: 0.1057 ||:  63%|######3   | 60/95 [00:41<00:24,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8057, UAS: 0.9302, LAS: 0.8704, UEM: 0.5490, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6765, partial_loss/deprel_loss: 1.2324, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4277, loss: 0.8589, batch_reg_loss: 0.1064, reg_loss: 0.1058 ||:  67%|######7   | 64/95 [00:44<00:20,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9303, LAS: 0.8706, UEM: 0.5485, LEM: 0.3040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5443, partial_loss/deprel_loss: 0.6740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7546, loss: 0.8559, batch_reg_loss: 0.1065, reg_loss: 0.1058 ||:  71%|#######   | 67/95 [00:46<00:19,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9307, LAS: 0.8712, UEM: 0.5517, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5476, partial_loss/deprel_loss: 0.7697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8318, loss: 0.8514, batch_reg_loss: 0.1066, reg_loss: 0.1058 ||:  74%|#######3  | 70/95 [00:48<00:17,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9311, LAS: 0.8715, UEM: 0.5508, LEM: 0.3045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4542, partial_loss/deprel_loss: 0.5922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6712, loss: 0.8487, batch_reg_loss: 0.1066, reg_loss: 0.1059 ||:  77%|#######6  | 73/95 [00:51<00:16,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9302, LAS: 0.8703, UEM: 0.5410, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5016, partial_loss/deprel_loss: 0.6399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7189, loss: 0.8583, batch_reg_loss: 0.1067, reg_loss: 0.1059 ||:  81%|########1 | 77/95 [00:53<00:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9304, LAS: 0.8706, UEM: 0.5378, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7016, partial_loss/deprel_loss: 0.8249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9071, loss: 0.8573, batch_reg_loss: 0.1068, reg_loss: 0.1059 ||:  84%|########4 | 80/95 [00:55<00:10,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9299, LAS: 0.8699, UEM: 0.5320, LEM: 0.2889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6495, partial_loss/deprel_loss: 0.8076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8828, loss: 0.8622, batch_reg_loss: 0.1068, reg_loss: 0.1060 ||:  87%|########7 | 83/95 [00:57<00:08,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9300, LAS: 0.8701, UEM: 0.5276, LEM: 0.2850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3396, partial_loss/deprel_loss: 0.5973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6527, loss: 0.8619, batch_reg_loss: 0.1069, reg_loss: 0.1060 ||:  92%|#########1| 87/95 [01:00<00:05,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9301, LAS: 0.8702, UEM: 0.5347, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1448, partial_loss/deprel_loss: 0.3613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4250, loss: 0.8602, batch_reg_loss: 0.1070, reg_loss: 0.1060 ||:  95%|#########4| 90/95 [01:03<00:03,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8696, UAS: 0.9307, LAS: 0.8709, UEM: 0.5418, LEM: 0.2965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6193, partial_loss/deprel_loss: 0.8146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8826, loss: 0.8549, batch_reg_loss: 0.1071, reg_loss: 0.1061 ||:  98%|#########7| 93/95 [01:05<00:01,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9309, LAS: 0.8709, UEM: 0.5424, LEM: 0.2963, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2886, partial_loss/deprel_loss: 0.5511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6057, loss: 0.8538, batch_reg_loss: 0.1071, reg_loss: 0.1061 ||: 100%|##########| 95/95 [01:06<00:00,  1.42it/s]\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.106  |       N/A\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - UEM                      |     0.542  |       N/A\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - LEM                      |     0.296  |       N/A\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - EM                       |     0.893  |       N/A\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.289  |       N/A\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:23:25,678 - INFO - combo.training.tensorboard_writer - UAS                      |     0.931  |       N/A\n",
+      "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.551  |       N/A\n",
+      "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - loss                     |     0.854  |       N/A\n",
+      "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - LAS                      |     0.871  |       N/A\n",
+      "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:23:25,679 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:23:25,680 - INFO - combo.training.trainer - Epoch duration: 0:01:06.809689\n",
+      "2023-04-06 23:23:25,680 - INFO - combo.training.trainer - Estimated training time remaining: 6:57:10\n",
+      "2023-04-06 23:23:25,680 - INFO - allennlp.training.trainer - Epoch 30/399\n",
+      "2023-04-06 23:23:25,680 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:23:25,680 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:23:25,687 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9485, LAS: 0.8883, UEM: 0.6172, LEM: 0.3185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2032, partial_loss/deprel_loss: 0.4108, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4765, loss: 0.6787, batch_reg_loss: 0.1072, reg_loss: 0.1071 ||:   3%|3         | 3/95 [00:02<01:09,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8077, UAS: 0.9325, LAS: 0.8739, UEM: 0.5788, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4854, partial_loss/deprel_loss: 1.1183, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2989, loss: 0.8021, batch_reg_loss: 0.1072, reg_loss: 0.1072 ||:   6%|6         | 6/95 [00:04<01:04,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7762, UAS: 0.9219, LAS: 0.8624, UEM: 0.5396, LEM: 0.2932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0344, partial_loss/deprel_loss: 1.3158, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5668, loss: 0.8970, batch_reg_loss: 0.1073, reg_loss: 0.1072 ||:  11%|#         | 10/95 [00:06<01:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8236, UAS: 0.9129, LAS: 0.8517, UEM: 0.4775, LEM: 0.2577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1380, partial_loss/deprel_loss: 1.0848, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2028, loss: 0.9815, batch_reg_loss: 0.1074, reg_loss: 0.1072 ||:  14%|#3        | 13/95 [00:09<01:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8573, UAS: 0.9162, LAS: 0.8554, UEM: 0.4791, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9552, partial_loss/deprel_loss: 0.8739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9976, loss: 0.9576, batch_reg_loss: 0.1074, reg_loss: 0.1073 ||:  17%|#6        | 16/95 [00:11<00:58,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9234, LAS: 0.8629, UEM: 0.5195, LEM: 0.2770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3310, partial_loss/deprel_loss: 0.5365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6029, loss: 0.9025, batch_reg_loss: 0.1075, reg_loss: 0.1073 ||:  21%|##1       | 20/95 [00:14<00:55,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9275, LAS: 0.8668, UEM: 0.5569, LEM: 0.3066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1406, partial_loss/deprel_loss: 0.3556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4202, loss: 0.8713, batch_reg_loss: 0.1076, reg_loss: 0.1073 ||:  24%|##4       | 23/95 [00:16<00:52,  1.37it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9298, LAS: 0.8694, UEM: 0.5545, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2576, partial_loss/deprel_loss: 0.5630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6095, loss: 0.8538, batch_reg_loss: 0.1077, reg_loss: 0.1074 ||:  27%|##7       | 26/95 [00:18<00:49,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9318, LAS: 0.8718, UEM: 0.5587, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4433, partial_loss/deprel_loss: 0.6041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6797, loss: 0.8347, batch_reg_loss: 0.1077, reg_loss: 0.1074 ||:  32%|###1      | 30/95 [00:21<00:45,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9319, LAS: 0.8721, UEM: 0.5770, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7107, partial_loss/deprel_loss: 0.7784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8727, loss: 0.8302, batch_reg_loss: 0.1078, reg_loss: 0.1075 ||:  35%|###4      | 33/95 [00:23<00:44,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9326, LAS: 0.8732, UEM: 0.5866, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3633, partial_loss/deprel_loss: 0.5928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6547, loss: 0.8227, batch_reg_loss: 0.1079, reg_loss: 0.1075 ||:  38%|###7      | 36/95 [00:26<00:44,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9322, LAS: 0.8728, UEM: 0.5688, LEM: 0.3217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5312, partial_loss/deprel_loss: 0.6978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7724, loss: 0.8291, batch_reg_loss: 0.1079, reg_loss: 0.1075 ||:  42%|####2     | 40/95 [00:28<00:40,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9310, LAS: 0.8717, UEM: 0.5667, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2758, partial_loss/deprel_loss: 0.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.8379, batch_reg_loss: 0.1080, reg_loss: 0.1076 ||:  45%|####5     | 43/95 [00:31<00:38,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9312, LAS: 0.8718, UEM: 0.5623, LEM: 0.3153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3805, partial_loss/deprel_loss: 0.5855, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6526, loss: 0.8358, batch_reg_loss: 0.1080, reg_loss: 0.1076 ||:  48%|####8     | 46/95 [00:33<00:35,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8767, UAS: 0.9322, LAS: 0.8732, UEM: 0.5874, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4912, partial_loss/deprel_loss: 0.6406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7188, loss: 0.8241, batch_reg_loss: 0.1081, reg_loss: 0.1076 ||:  52%|#####1    | 49/95 [00:35<00:36,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9321, LAS: 0.8729, UEM: 0.5790, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6182, partial_loss/deprel_loss: 0.7551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8359, loss: 0.8273, batch_reg_loss: 0.1082, reg_loss: 0.1077 ||:  56%|#####5    | 53/95 [00:38<00:30,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9317, LAS: 0.8724, UEM: 0.5672, LEM: 0.3272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6344, partial_loss/deprel_loss: 0.7732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8537, loss: 0.8331, batch_reg_loss: 0.1083, reg_loss: 0.1077 ||:  60%|######    | 57/95 [00:40<00:26,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8763, UAS: 0.9317, LAS: 0.8721, UEM: 0.5641, LEM: 0.3220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5027, partial_loss/deprel_loss: 0.6883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7596, loss: 0.8379, batch_reg_loss: 0.1084, reg_loss: 0.1077 ||:  64%|######4   | 61/95 [00:43<00:22,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9305, LAS: 0.8704, UEM: 0.5515, LEM: 0.3111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6451, partial_loss/deprel_loss: 0.8968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9549, loss: 0.8522, batch_reg_loss: 0.1084, reg_loss: 0.1078 ||:  68%|######8   | 65/95 [00:45<00:19,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8938, UAS: 0.9315, LAS: 0.8714, UEM: 0.5530, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2872, partial_loss/deprel_loss: 0.5400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5980, loss: 0.8460, batch_reg_loss: 0.1085, reg_loss: 0.1078 ||:  73%|#######2  | 69/95 [00:48<00:17,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9325, LAS: 0.8724, UEM: 0.5549, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2872, partial_loss/deprel_loss: 0.5391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5974, loss: 0.8382, batch_reg_loss: 0.1086, reg_loss: 0.1079 ||:  77%|#######6  | 73/95 [00:51<00:14,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9322, LAS: 0.8720, UEM: 0.5487, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6038, partial_loss/deprel_loss: 0.7871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8591, loss: 0.8423, batch_reg_loss: 0.1087, reg_loss: 0.1079 ||:  81%|########1 | 77/95 [00:53<00:11,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8324, UAS: 0.9292, LAS: 0.8688, UEM: 0.5399, LEM: 0.2935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3246, partial_loss/deprel_loss: 0.9912, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1667, loss: 0.8666, batch_reg_loss: 0.1088, reg_loss: 0.1080 ||:  85%|########5 | 81/95 [00:56<00:08,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9303, LAS: 0.8701, UEM: 0.5412, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4508, partial_loss/deprel_loss: 0.6363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7081, loss: 0.8578, batch_reg_loss: 0.1089, reg_loss: 0.1080 ||:  89%|########9 | 85/95 [00:58<00:06,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.9302, LAS: 0.8701, UEM: 0.5400, LEM: 0.2905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1560, partial_loss/deprel_loss: 1.0515, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1814, loss: 0.8587, batch_reg_loss: 0.1090, reg_loss: 0.1080 ||:  94%|#########3| 89/95 [01:01<00:03,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8224, UAS: 0.9308, LAS: 0.8708, UEM: 0.5543, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3766, partial_loss/deprel_loss: 1.1223, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2822, loss: 0.8519, batch_reg_loss: 0.1091, reg_loss: 0.1081 ||:  98%|#########7| 93/95 [01:04<00:01,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9304, LAS: 0.8703, UEM: 0.5497, LEM: 0.2994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0909, partial_loss/deprel_loss: 1.0622, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1771, loss: 0.8557, batch_reg_loss: 0.1091, reg_loss: 0.1081 ||: 100%|##########| 95/95 [01:05<00:00,  1.45it/s]\n",
+      "2023-04-06 23:24:31,061 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9493, LAS: 0.8889, UEM: 0.5691, LEM: 0.1780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4038, partial_loss/deprel_loss: 28.1250, partial_loss/cycle_loss: 0.0000, batch_loss: 22.5808, loss: 22.6030, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:06,  1.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9441, LAS: 0.8850, UEM: 0.5694, LEM: 0.2298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2868, partial_loss/deprel_loss: 27.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 21.9448, loss: 27.0188, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:05,  1.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9383, LAS: 0.8790, UEM: 0.4910, LEM: 0.1820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8210, partial_loss/deprel_loss: 42.9013, partial_loss/cycle_loss: 0.0000, batch_loss: 34.4852, loss: 28.7889, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:07<00:02,  1.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9470, LAS: 0.8918, UEM: 0.6641, LEM: 0.3843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2145, partial_loss/deprel_loss: 22.0492, partial_loss/cycle_loss: 0.0000, batch_loss: 17.6823, loss: 25.6736, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9470, LAS: 0.8918, UEM: 0.6641, LEM: 0.3843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2145, partial_loss/deprel_loss: 22.0492, partial_loss/cycle_loss: 0.0000, batch_loss: 17.6823, loss: 25.6736, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.04it/s]\n",
+      "2023-04-06 23:24:41,625 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.108  |     0.000\n",
+      "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - UEM                      |     0.550  |     0.664\n",
+      "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - LEM                      |     0.299  |     0.384\n",
+      "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - EM                       |     0.832  |     0.927\n",
+      "2023-04-06 23:24:41,626 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.091  |     0.214\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |     0.947\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.062  |    22.049\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - loss                     |     0.856  |    25.674\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - LAS                      |     0.870  |     0.892\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:24:41,627 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:24:41,628 - INFO - combo.training.trainer - Epoch duration: 0:01:15.948043\n",
+      "2023-04-06 23:24:41,628 - INFO - combo.training.trainer - Estimated training time remaining: 6:57:41\n",
+      "2023-04-06 23:24:41,628 - INFO - allennlp.training.trainer - Epoch 31/399\n",
+      "2023-04-06 23:24:41,628 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:24:41,629 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:24:41,636 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9554, LAS: 0.8921, UEM: 0.6602, LEM: 0.3069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3671, partial_loss/deprel_loss: 0.6465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6998, loss: 0.6303, batch_reg_loss: 0.1092, reg_loss: 0.1091 ||:   3%|3         | 3/95 [00:02<01:12,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8760, UAS: 0.9520, LAS: 0.8914, UEM: 0.6391, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4923, partial_loss/deprel_loss: 0.7018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7691, loss: 0.6716, batch_reg_loss: 0.1092, reg_loss: 0.1092 ||:   7%|7         | 7/95 [00:05<01:06,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9453, LAS: 0.8853, UEM: 0.5792, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7182, partial_loss/deprel_loss: 0.7852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8811, loss: 0.7250, batch_reg_loss: 0.1093, reg_loss: 0.1092 ||:  12%|#1        | 11/95 [00:07<00:59,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9388, LAS: 0.8788, UEM: 0.5190, LEM: 0.2554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9456, partial_loss/deprel_loss: 0.8558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9832, loss: 0.7850, batch_reg_loss: 0.1094, reg_loss: 0.1093 ||:  16%|#5        | 15/95 [00:10<00:55,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9360, LAS: 0.8756, UEM: 0.5046, LEM: 0.2419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5136, partial_loss/deprel_loss: 0.6491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7315, loss: 0.8117, batch_reg_loss: 0.1095, reg_loss: 0.1093 ||:  20%|##        | 19/95 [00:12<00:51,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8336, UAS: 0.9332, LAS: 0.8718, UEM: 0.4720, LEM: 0.2205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1145, partial_loss/deprel_loss: 1.1053, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2167, loss: 0.8445, batch_reg_loss: 0.1096, reg_loss: 0.1094 ||:  24%|##4       | 23/95 [00:15<00:46,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9323, LAS: 0.8711, UEM: 0.4599, LEM: 0.2114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4132, partial_loss/deprel_loss: 0.5635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6431, loss: 0.8527, batch_reg_loss: 0.1097, reg_loss: 0.1094 ||:  27%|##7       | 26/95 [00:17<00:45,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8258, UAS: 0.9323, LAS: 0.8707, UEM: 0.4526, LEM: 0.2018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2397, partial_loss/deprel_loss: 1.0853, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2260, loss: 0.8561, batch_reg_loss: 0.1098, reg_loss: 0.1094 ||:  32%|###1      | 30/95 [00:19<00:43,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9332, LAS: 0.8717, UEM: 0.4648, LEM: 0.2095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5229, partial_loss/deprel_loss: 0.7206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7909, loss: 0.8484, batch_reg_loss: 0.1098, reg_loss: 0.1095 ||:  35%|###4      | 33/95 [00:21<00:41,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8922, UAS: 0.9322, LAS: 0.8707, UEM: 0.4506, LEM: 0.2005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4654, partial_loss/deprel_loss: 0.6659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7357, loss: 0.8623, batch_reg_loss: 0.1099, reg_loss: 0.1095 ||:  39%|###8      | 37/95 [00:24<00:39,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8660, UAS: 0.9307, LAS: 0.8692, UEM: 0.4356, LEM: 0.1922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8033, partial_loss/deprel_loss: 0.7658, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8833, loss: 0.8725, batch_reg_loss: 0.1100, reg_loss: 0.1095 ||:  42%|####2     | 40/95 [00:26<00:37,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9296, LAS: 0.8678, UEM: 0.4272, LEM: 0.1879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5058, partial_loss/deprel_loss: 0.7003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7714, loss: 0.8843, batch_reg_loss: 0.1101, reg_loss: 0.1096 ||:  45%|####5     | 43/95 [00:28<00:36,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8312, UAS: 0.9295, LAS: 0.8681, UEM: 0.4315, LEM: 0.1898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2709, partial_loss/deprel_loss: 1.0338, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1913, loss: 0.8818, batch_reg_loss: 0.1101, reg_loss: 0.1096 ||:  48%|####8     | 46/95 [00:31<00:34,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8474, UAS: 0.9283, LAS: 0.8667, UEM: 0.4210, LEM: 0.1832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8996, partial_loss/deprel_loss: 0.9643, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0616, loss: 0.8929, batch_reg_loss: 0.1102, reg_loss: 0.1096 ||:  52%|#####1    | 49/95 [00:33<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8787, UAS: 0.9301, LAS: 0.8692, UEM: 0.4763, LEM: 0.2466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4993, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8411, loss: 0.8742, batch_reg_loss: 0.1103, reg_loss: 0.1097 ||:  55%|#####4    | 52/95 [00:35<00:32,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8096, UAS: 0.9290, LAS: 0.8679, UEM: 0.4825, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5268, partial_loss/deprel_loss: 1.2334, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4024, loss: 0.8846, batch_reg_loss: 0.1103, reg_loss: 0.1097 ||:  58%|#####7    | 55/95 [00:37<00:29,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9300, LAS: 0.8691, UEM: 0.4876, LEM: 0.2528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3654, partial_loss/deprel_loss: 0.5977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6616, loss: 0.8741, batch_reg_loss: 0.1104, reg_loss: 0.1098 ||:  62%|######2   | 59/95 [00:40<00:25,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9287, LAS: 0.8678, UEM: 0.4850, LEM: 0.2498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3838, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6438, loss: 0.8828, batch_reg_loss: 0.1105, reg_loss: 0.1098 ||:  65%|######5   | 62/95 [00:42<00:23,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9287, LAS: 0.8679, UEM: 0.4826, LEM: 0.2463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2953, partial_loss/deprel_loss: 0.4981, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5681, loss: 0.8820, batch_reg_loss: 0.1106, reg_loss: 0.1098 ||:  69%|######9   | 66/95 [00:45<00:19,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9300, LAS: 0.8695, UEM: 0.5009, LEM: 0.2615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2549, partial_loss/deprel_loss: 0.4462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5186, loss: 0.8702, batch_reg_loss: 0.1107, reg_loss: 0.1099 ||:  73%|#######2  | 69/95 [00:47<00:18,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8733, UAS: 0.9294, LAS: 0.8688, UEM: 0.5009, LEM: 0.2610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6164, partial_loss/deprel_loss: 0.7282, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8166, loss: 0.8738, batch_reg_loss: 0.1107, reg_loss: 0.1099 ||:  77%|#######6  | 73/95 [00:49<00:14,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9307, LAS: 0.8707, UEM: 0.5151, LEM: 0.2706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3304, partial_loss/deprel_loss: 0.4397, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5286, loss: 0.8588, batch_reg_loss: 0.1108, reg_loss: 0.1100 ||:  81%|########1 | 77/95 [00:52<00:12,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9316, LAS: 0.8717, UEM: 0.5285, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3180, partial_loss/deprel_loss: 0.4770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5561, loss: 0.8500, batch_reg_loss: 0.1109, reg_loss: 0.1100 ||:  84%|########4 | 80/95 [00:54<00:10,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8129, UAS: 0.9313, LAS: 0.8716, UEM: 0.5363, LEM: 0.2931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3228, partial_loss/deprel_loss: 1.0582, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2221, loss: 0.8503, batch_reg_loss: 0.1110, reg_loss: 0.1100 ||:  88%|########8 | 84/95 [00:57<00:07,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8308, UAS: 0.9315, LAS: 0.8718, UEM: 0.5368, LEM: 0.2930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2220, partial_loss/deprel_loss: 1.0879, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2257, loss: 0.8498, batch_reg_loss: 0.1110, reg_loss: 0.1101 ||:  93%|#########2| 88/95 [00:59<00:04,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9328, LAS: 0.8732, UEM: 0.5466, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2679, partial_loss/deprel_loss: 0.5869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6342, loss: 0.8388, batch_reg_loss: 0.1111, reg_loss: 0.1101 ||:  97%|#########6| 92/95 [01:02<00:01,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9323, LAS: 0.8726, UEM: 0.5503, LEM: 0.3030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1446, partial_loss/deprel_loss: 0.3587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4271, loss: 0.8418, batch_reg_loss: 0.1112, reg_loss: 0.1102 ||: 100%|##########| 95/95 [01:04<00:00,  1.48it/s]\n",
+      "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.110  |       N/A\n",
+      "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:25:45,951 - INFO - combo.training.tensorboard_writer - UEM                      |     0.550  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - LEM                      |     0.303  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - EM                       |     0.921  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.145  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - UAS                      |     0.932  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.359  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - loss                     |     0.842  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - LAS                      |     0.873  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.596  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:25:45,952 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:25:45,953 - INFO - combo.training.trainer - Epoch duration: 0:01:04.324762\n",
+      "2023-04-06 23:25:45,953 - INFO - combo.training.trainer - Estimated training time remaining: 6:55:52\n",
+      "2023-04-06 23:25:45,953 - INFO - allennlp.training.trainer - Epoch 32/399\n",
+      "2023-04-06 23:25:45,953 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:25:45,954 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:25:45,959 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9301, LAS: 0.8697, UEM: 0.4459, LEM: 0.2277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4560, partial_loss/deprel_loss: 0.6288, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7054, loss: 0.8977, batch_reg_loss: 0.1112, reg_loss: 0.1112 ||:   4%|4         | 4/95 [00:02<01:00,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9292, LAS: 0.8692, UEM: 0.4227, LEM: 0.1978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6525, partial_loss/deprel_loss: 0.7815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8671, loss: 0.8927, batch_reg_loss: 0.1113, reg_loss: 0.1112 ||:   8%|8         | 8/95 [00:05<00:56,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9238, LAS: 0.8639, UEM: 0.4082, LEM: 0.1875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4358, partial_loss/deprel_loss: 0.5976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6766, loss: 0.9322, batch_reg_loss: 0.1114, reg_loss: 0.1113 ||:  13%|#2        | 12/95 [00:07<00:53,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9317, LAS: 0.8737, UEM: 0.5259, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3335, partial_loss/deprel_loss: 0.5011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5790, loss: 0.8531, batch_reg_loss: 0.1115, reg_loss: 0.1113 ||:  16%|#5        | 15/95 [00:09<00:52,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9319, LAS: 0.8730, UEM: 0.5110, LEM: 0.2590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5019, partial_loss/deprel_loss: 0.6581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7384, loss: 0.8532, batch_reg_loss: 0.1116, reg_loss: 0.1114 ||:  20%|##        | 19/95 [00:12<00:49,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9342, LAS: 0.8755, UEM: 0.5384, LEM: 0.2840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1421, partial_loss/deprel_loss: 0.3785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4428, loss: 0.8315, batch_reg_loss: 0.1116, reg_loss: 0.1114 ||:  24%|##4       | 23/95 [00:14<00:46,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9353, LAS: 0.8765, UEM: 0.5362, LEM: 0.2757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4069, partial_loss/deprel_loss: 0.6017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6745, loss: 0.8210, batch_reg_loss: 0.1117, reg_loss: 0.1114 ||:  27%|##7       | 26/95 [00:17<00:47,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7829, UAS: 0.9313, LAS: 0.8721, UEM: 0.5203, LEM: 0.2657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9171, partial_loss/deprel_loss: 1.3065, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5404, loss: 0.8508, batch_reg_loss: 0.1118, reg_loss: 0.1115 ||:  31%|###       | 29/95 [00:19<00:44,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8923, UAS: 0.9340, LAS: 0.8752, UEM: 0.5428, LEM: 0.2809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3922, partial_loss/deprel_loss: 0.5541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6335, loss: 0.8246, batch_reg_loss: 0.1118, reg_loss: 0.1115 ||:  34%|###3      | 32/95 [00:21<00:44,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8264, UAS: 0.9337, LAS: 0.8745, UEM: 0.5313, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2626, partial_loss/deprel_loss: 1.0762, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2253, loss: 0.8320, batch_reg_loss: 0.1119, reg_loss: 0.1115 ||:  38%|###7      | 36/95 [00:23<00:39,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9334, LAS: 0.8741, UEM: 0.5304, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2678, partial_loss/deprel_loss: 0.5026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5676, loss: 0.8348, batch_reg_loss: 0.1120, reg_loss: 0.1116 ||:  41%|####1     | 39/95 [00:26<00:40,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9327, LAS: 0.8730, UEM: 0.5162, LEM: 0.2619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5278, partial_loss/deprel_loss: 0.7001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7776, loss: 0.8433, batch_reg_loss: 0.1120, reg_loss: 0.1116 ||:  44%|####4     | 42/95 [00:28<00:37,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9329, LAS: 0.8732, UEM: 0.5139, LEM: 0.2592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3069, partial_loss/deprel_loss: 0.5136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5843, loss: 0.8430, batch_reg_loss: 0.1121, reg_loss: 0.1116 ||:  47%|####7     | 45/95 [00:30<00:35,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8254, UAS: 0.9331, LAS: 0.8734, UEM: 0.5439, LEM: 0.3044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1491, partial_loss/deprel_loss: 1.0949, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2179, loss: 0.8432, batch_reg_loss: 0.1121, reg_loss: 0.1117 ||:  51%|#####     | 48/95 [00:32<00:34,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9332, LAS: 0.8734, UEM: 0.5434, LEM: 0.3024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2184, partial_loss/deprel_loss: 0.4329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5022, loss: 0.8439, batch_reg_loss: 0.1122, reg_loss: 0.1117 ||:  55%|#####4    | 52/95 [00:35<00:30,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9338, LAS: 0.8742, UEM: 0.5455, LEM: 0.3016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0053, partial_loss/deprel_loss: 0.9650, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0853, loss: 0.8405, batch_reg_loss: 0.1123, reg_loss: 0.1117 ||:  58%|#####7    | 55/95 [00:37<00:28,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9324, LAS: 0.8728, UEM: 0.5294, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8218, partial_loss/deprel_loss: 0.9741, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0561, loss: 0.8512, batch_reg_loss: 0.1124, reg_loss: 0.1118 ||:  62%|######2   | 59/95 [00:39<00:24,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9331, LAS: 0.8736, UEM: 0.5349, LEM: 0.2919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1961, partial_loss/deprel_loss: 0.4335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4984, loss: 0.8452, batch_reg_loss: 0.1125, reg_loss: 0.1118 ||:  65%|######5   | 62/95 [00:42<00:22,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9335, LAS: 0.8738, UEM: 0.5307, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2864, partial_loss/deprel_loss: 0.5466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6071, loss: 0.8436, batch_reg_loss: 0.1125, reg_loss: 0.1119 ||:  69%|######9   | 66/95 [00:44<00:19,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8010, UAS: 0.9334, LAS: 0.8740, UEM: 0.5416, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5383, partial_loss/deprel_loss: 1.2065, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3855, loss: 0.8403, batch_reg_loss: 0.1126, reg_loss: 0.1119 ||:  74%|#######3  | 70/95 [00:47<00:16,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8606, UAS: 0.9331, LAS: 0.8737, UEM: 0.5406, LEM: 0.2966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7620, partial_loss/deprel_loss: 0.8850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9730, loss: 0.8439, batch_reg_loss: 0.1127, reg_loss: 0.1119 ||:  77%|#######6  | 73/95 [00:49<00:14,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9328, LAS: 0.8733, UEM: 0.5343, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5312, partial_loss/deprel_loss: 0.6720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7566, loss: 0.8478, batch_reg_loss: 0.1127, reg_loss: 0.1120 ||:  80%|########  | 76/95 [00:51<00:12,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9316, LAS: 0.8721, UEM: 0.5348, LEM: 0.2911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.4674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5322, loss: 0.8570, batch_reg_loss: 0.1128, reg_loss: 0.1120 ||:  83%|########3 | 79/95 [00:53<00:11,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9323, LAS: 0.8730, UEM: 0.5379, LEM: 0.2908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4902, partial_loss/deprel_loss: 0.6764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7520, loss: 0.8507, batch_reg_loss: 0.1129, reg_loss: 0.1120 ||:  86%|########6 | 82/95 [00:56<00:09,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9326, LAS: 0.8733, UEM: 0.5386, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2232, partial_loss/deprel_loss: 0.4530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5200, loss: 0.8478, batch_reg_loss: 0.1129, reg_loss: 0.1121 ||:  89%|########9 | 85/95 [00:58<00:07,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9326, LAS: 0.8732, UEM: 0.5383, LEM: 0.2906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6636, partial_loss/deprel_loss: 0.7732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8643, loss: 0.8471, batch_reg_loss: 0.1130, reg_loss: 0.1121 ||:  93%|#########2| 88/95 [01:00<00:05,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8125, UAS: 0.9313, LAS: 0.8716, UEM: 0.5328, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4500, partial_loss/deprel_loss: 1.1874, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3530, loss: 0.8586, batch_reg_loss: 0.1131, reg_loss: 0.1121 ||:  96%|#########5| 91/95 [01:02<00:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9320, LAS: 0.8725, UEM: 0.5489, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8698, partial_loss/deprel_loss: 0.9173, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0209, loss: 0.8512, batch_reg_loss: 0.1131, reg_loss: 0.1121 ||:  99%|#########8| 94/95 [01:04<00:00,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9323, LAS: 0.8729, UEM: 0.5514, LEM: 0.3059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2711, partial_loss/deprel_loss: 0.4642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5387, loss: 0.8479, batch_reg_loss: 0.1131, reg_loss: 0.1122 ||: 100%|##########| 95/95 [01:05<00:00,  1.45it/s]\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.112  |       N/A\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - UEM                      |     0.551  |       N/A\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - LEM                      |     0.306  |       N/A\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - EM                       |     0.908  |       N/A\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.271  |       N/A\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:26:51,300 - INFO - combo.training.tensorboard_writer - UAS                      |     0.932  |       N/A\n",
+      "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.464  |       N/A\n",
+      "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - loss                     |     0.848  |       N/A\n",
+      "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - LAS                      |     0.873  |       N/A\n",
+      "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:26:51,301 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:26:51,302 - INFO - combo.training.trainer - Epoch duration: 0:01:05.348414\n",
+      "2023-04-06 23:26:51,302 - INFO - combo.training.trainer - Estimated training time remaining: 6:54:17\n",
+      "2023-04-06 23:26:51,302 - INFO - allennlp.training.trainer - Epoch 33/399\n",
+      "2023-04-06 23:26:51,302 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:26:51,302 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:26:51,308 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9486, LAS: 0.8924, UEM: 0.7037, LEM: 0.4360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2468, partial_loss/deprel_loss: 0.4336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5094, loss: 0.6325, batch_reg_loss: 0.1132, reg_loss: 0.1132 ||:   3%|3         | 3/95 [00:02<01:11,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9275, LAS: 0.8681, UEM: 0.5495, LEM: 0.3218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8843, partial_loss/deprel_loss: 0.8701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9862, loss: 0.8366, batch_reg_loss: 0.1133, reg_loss: 0.1132 ||:   7%|7         | 7/95 [00:04<01:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7927, UAS: 0.9251, LAS: 0.8656, UEM: 0.5293, LEM: 0.2882, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7105, partial_loss/deprel_loss: 1.2121, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4251, loss: 0.8632, batch_reg_loss: 0.1133, reg_loss: 0.1132 ||:  11%|#         | 10/95 [00:06<01:01,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9341, LAS: 0.8756, UEM: 0.6130, LEM: 0.3508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1157, partial_loss/deprel_loss: 0.3530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4190, loss: 0.7885, batch_reg_loss: 0.1134, reg_loss: 0.1133 ||:  14%|#3        | 13/95 [00:09<01:01,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8733, UAS: 0.9371, LAS: 0.8785, UEM: 0.6068, LEM: 0.3334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6198, partial_loss/deprel_loss: 0.7161, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8103, loss: 0.7708, batch_reg_loss: 0.1135, reg_loss: 0.1133 ||:  17%|#6        | 16/95 [00:11<00:57,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9419, LAS: 0.8848, UEM: 0.6580, LEM: 0.3863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2149, partial_loss/deprel_loss: 0.4466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5137, loss: 0.7275, batch_reg_loss: 0.1135, reg_loss: 0.1133 ||:  20%|##        | 19/95 [00:13<00:57,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8433, UAS: 0.9369, LAS: 0.8787, UEM: 0.6148, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9499, partial_loss/deprel_loss: 0.9590, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0708, loss: 0.7791, batch_reg_loss: 0.1136, reg_loss: 0.1134 ||:  24%|##4       | 23/95 [00:16<00:51,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9355, LAS: 0.8764, UEM: 0.5868, LEM: 0.3315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3288, partial_loss/deprel_loss: 0.6071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6651, loss: 0.8012, batch_reg_loss: 0.1137, reg_loss: 0.1134 ||:  28%|##8       | 27/95 [00:18<00:47,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8259, UAS: 0.9343, LAS: 0.8750, UEM: 0.5813, LEM: 0.3274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2071, partial_loss/deprel_loss: 1.0966, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2324, loss: 0.8155, batch_reg_loss: 0.1137, reg_loss: 0.1134 ||:  32%|###1      | 30/95 [00:21<00:45,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9336, LAS: 0.8742, UEM: 0.5707, LEM: 0.3162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4102, partial_loss/deprel_loss: 0.6142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6872, loss: 0.8187, batch_reg_loss: 0.1138, reg_loss: 0.1135 ||:  35%|###4      | 33/95 [00:23<00:43,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9355, LAS: 0.8767, UEM: 0.5810, LEM: 0.3218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3768, partial_loss/deprel_loss: 0.5456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6257, loss: 0.8022, batch_reg_loss: 0.1138, reg_loss: 0.1135 ||:  38%|###7      | 36/95 [00:25<00:43,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8634, UAS: 0.9352, LAS: 0.8765, UEM: 0.5675, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7297, partial_loss/deprel_loss: 0.8530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9423, loss: 0.8053, batch_reg_loss: 0.1139, reg_loss: 0.1135 ||:  41%|####1     | 39/95 [00:27<00:40,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9338, LAS: 0.8749, UEM: 0.5621, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2653, partial_loss/deprel_loss: 0.5660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.8215, batch_reg_loss: 0.1140, reg_loss: 0.1136 ||:  44%|####4     | 42/95 [00:29<00:37,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8497, UAS: 0.9320, LAS: 0.8728, UEM: 0.5448, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8942, partial_loss/deprel_loss: 0.9231, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0313, loss: 0.8381, batch_reg_loss: 0.1141, reg_loss: 0.1136 ||:  48%|####8     | 46/95 [00:31<00:32,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8354, UAS: 0.9327, LAS: 0.8732, UEM: 0.5526, LEM: 0.2956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1232, partial_loss/deprel_loss: 1.0909, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2115, loss: 0.8358, batch_reg_loss: 0.1141, reg_loss: 0.1136 ||:  53%|#####2    | 50/95 [00:34<00:30,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8364, UAS: 0.9309, LAS: 0.8713, UEM: 0.5454, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1690, partial_loss/deprel_loss: 0.9704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1244, loss: 0.8545, batch_reg_loss: 0.1142, reg_loss: 0.1137 ||:  57%|#####6    | 54/95 [00:37<00:27,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9310, LAS: 0.8713, UEM: 0.5375, LEM: 0.2834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4611, partial_loss/deprel_loss: 0.6311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7114, loss: 0.8543, batch_reg_loss: 0.1143, reg_loss: 0.1137 ||:  61%|######1   | 58/95 [00:39<00:23,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8470, UAS: 0.9307, LAS: 0.8712, UEM: 0.5276, LEM: 0.2754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0411, partial_loss/deprel_loss: 0.9490, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0818, loss: 0.8585, batch_reg_loss: 0.1144, reg_loss: 0.1138 ||:  65%|######5   | 62/95 [00:42<00:21,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7762, UAS: 0.9291, LAS: 0.8694, UEM: 0.5234, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2625, partial_loss/deprel_loss: 1.5342, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7944, loss: 0.8754, batch_reg_loss: 0.1145, reg_loss: 0.1138 ||:  69%|######9   | 66/95 [00:45<00:18,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9305, LAS: 0.8709, UEM: 0.5339, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3025, partial_loss/deprel_loss: 0.5761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6360, loss: 0.8629, batch_reg_loss: 0.1146, reg_loss: 0.1139 ||:  74%|#######3  | 70/95 [00:47<00:15,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9320, LAS: 0.8724, UEM: 0.5526, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2794, partial_loss/deprel_loss: 0.4444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5261, loss: 0.8488, batch_reg_loss: 0.1147, reg_loss: 0.1139 ||:  78%|#######7  | 74/95 [00:50<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8843, UAS: 0.9328, LAS: 0.8733, UEM: 0.5528, LEM: 0.2902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4616, partial_loss/deprel_loss: 0.6105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6955, loss: 0.8418, batch_reg_loss: 0.1148, reg_loss: 0.1139 ||:  82%|########2 | 78/95 [00:52<00:11,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9323, LAS: 0.8727, UEM: 0.5434, LEM: 0.2835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5145, partial_loss/deprel_loss: 0.6636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7486, loss: 0.8450, batch_reg_loss: 0.1148, reg_loss: 0.1140 ||:  86%|########6 | 82/95 [00:55<00:08,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9326, LAS: 0.8728, UEM: 0.5411, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7292, partial_loss/deprel_loss: 0.9182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9953, loss: 0.8444, batch_reg_loss: 0.1149, reg_loss: 0.1140 ||:  91%|######### | 86/95 [00:58<00:06,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7848, UAS: 0.9314, LAS: 0.8716, UEM: 0.5342, LEM: 0.2754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8967, partial_loss/deprel_loss: 1.2783, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5170, loss: 0.8545, batch_reg_loss: 0.1150, reg_loss: 0.1141 ||:  95%|#########4| 90/95 [01:01<00:03,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9317, LAS: 0.8721, UEM: 0.5383, LEM: 0.2787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3309, partial_loss/deprel_loss: 0.5393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6127, loss: 0.8494, batch_reg_loss: 0.1151, reg_loss: 0.1141 ||:  98%|#########7| 93/95 [01:03<00:01,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9323, LAS: 0.8730, UEM: 0.5542, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0884, partial_loss/deprel_loss: 0.2159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3055, loss: 0.8428, batch_reg_loss: 0.1151, reg_loss: 0.1141 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n",
+      "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.114  |       N/A\n",
+      "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - UEM                      |     0.554  |       N/A\n",
+      "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - LEM                      |     0.301  |       N/A\n",
+      "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - EM                       |     0.947  |       N/A\n",
+      "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.088  |       N/A\n",
+      "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:27:56,390 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - UAS                      |     0.932  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.216  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - loss                     |     0.843  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - LAS                      |     0.873  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:27:56,391 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:27:56,392 - INFO - combo.training.trainer - Epoch duration: 0:01:05.090000\n",
+      "2023-04-06 23:27:56,392 - INFO - combo.training.trainer - Estimated training time remaining: 6:52:40\n",
+      "2023-04-06 23:27:56,392 - INFO - allennlp.training.trainer - Epoch 34/399\n",
+      "2023-04-06 23:27:56,392 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:27:56,392 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:27:56,399 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9454, LAS: 0.8897, UEM: 0.5625, LEM: 0.2768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2900, partial_loss/deprel_loss: 0.4427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5273, loss: 0.6903, batch_reg_loss: 0.1152, reg_loss: 0.1151 ||:   3%|3         | 3/95 [00:02<01:07,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9508, LAS: 0.8929, UEM: 0.5816, LEM: 0.2577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3096, partial_loss/deprel_loss: 0.5456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6136, loss: 0.6771, batch_reg_loss: 0.1152, reg_loss: 0.1152 ||:   6%|6         | 6/95 [00:04<01:07,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8149, UAS: 0.9394, LAS: 0.8797, UEM: 0.5386, LEM: 0.2403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4532, partial_loss/deprel_loss: 1.0855, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2743, loss: 0.7823, batch_reg_loss: 0.1153, reg_loss: 0.1152 ||:   9%|9         | 9/95 [00:06<01:02,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9356, LAS: 0.8751, UEM: 0.5214, LEM: 0.2343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2411, partial_loss/deprel_loss: 0.5428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5978, loss: 0.8289, batch_reg_loss: 0.1153, reg_loss: 0.1152 ||:  13%|#2        | 12/95 [00:08<00:59,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9389, LAS: 0.8795, UEM: 0.5678, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2516, partial_loss/deprel_loss: 0.4979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5640, loss: 0.7939, batch_reg_loss: 0.1154, reg_loss: 0.1153 ||:  16%|#5        | 15/95 [00:10<00:57,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9348, LAS: 0.8752, UEM: 0.5681, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3626, partial_loss/deprel_loss: 0.5587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6350, loss: 0.8295, batch_reg_loss: 0.1155, reg_loss: 0.1153 ||:  20%|##        | 19/95 [00:13<00:53,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9346, LAS: 0.8753, UEM: 0.5636, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1973, partial_loss/deprel_loss: 0.4340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5022, loss: 0.8377, batch_reg_loss: 0.1156, reg_loss: 0.1153 ||:  24%|##4       | 23/95 [00:16<00:50,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9337, LAS: 0.8742, UEM: 0.5384, LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9168, partial_loss/deprel_loss: 0.8650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9910, loss: 0.8480, batch_reg_loss: 0.1156, reg_loss: 0.1154 ||:  28%|##8       | 27/95 [00:18<00:45,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8347, UAS: 0.9311, LAS: 0.8712, UEM: 0.5121, LEM: 0.2509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0191, partial_loss/deprel_loss: 1.0519, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1611, loss: 0.8715, batch_reg_loss: 0.1157, reg_loss: 0.1154 ||:  33%|###2      | 31/95 [00:21<00:41,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9323, LAS: 0.8731, UEM: 0.5610, LEM: 0.3197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0757, partial_loss/deprel_loss: 0.1835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2778, loss: 0.8571, batch_reg_loss: 0.1158, reg_loss: 0.1155 ||:  37%|###6      | 35/95 [00:24<00:43,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8708, UAS: 0.9323, LAS: 0.8734, UEM: 0.5630, LEM: 0.3250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7922, partial_loss/deprel_loss: 0.7743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8938, loss: 0.8563, batch_reg_loss: 0.1159, reg_loss: 0.1155 ||:  40%|####      | 38/95 [00:27<00:42,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9324, LAS: 0.8735, UEM: 0.5549, LEM: 0.3176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6392, partial_loss/deprel_loss: 0.7389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8349, loss: 0.8536, batch_reg_loss: 0.1160, reg_loss: 0.1155 ||:  43%|####3     | 41/95 [00:29<00:39,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9329, LAS: 0.8741, UEM: 0.5491, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.5804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6518, loss: 0.8504, batch_reg_loss: 0.1160, reg_loss: 0.1156 ||:  46%|####6     | 44/95 [00:31<00:36,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9322, LAS: 0.8733, UEM: 0.5394, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6864, partial_loss/deprel_loss: 0.8533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9360, loss: 0.8589, batch_reg_loss: 0.1161, reg_loss: 0.1156 ||:  49%|####9     | 47/95 [00:33<00:34,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9318, LAS: 0.8731, UEM: 0.5378, LEM: 0.3014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3048, partial_loss/deprel_loss: 0.4642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5485, loss: 0.8600, batch_reg_loss: 0.1162, reg_loss: 0.1156 ||:  53%|#####2    | 50/95 [00:35<00:33,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9308, LAS: 0.8725, UEM: 0.5379, LEM: 0.3045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2728, partial_loss/deprel_loss: 0.4212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5077, loss: 0.8667, batch_reg_loss: 0.1162, reg_loss: 0.1157 ||:  56%|#####5    | 53/95 [00:37<00:30,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9318, LAS: 0.8736, UEM: 0.5398, LEM: 0.3014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4101, partial_loss/deprel_loss: 0.5982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6769, loss: 0.8583, batch_reg_loss: 0.1163, reg_loss: 0.1157 ||:  59%|#####8    | 56/95 [00:40<00:28,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9318, LAS: 0.8738, UEM: 0.5579, LEM: 0.3196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1905, partial_loss/deprel_loss: 0.4280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4969, loss: 0.8554, batch_reg_loss: 0.1163, reg_loss: 0.1157 ||:  62%|######2   | 59/95 [00:42<00:26,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9326, LAS: 0.8744, UEM: 0.5555, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5130, partial_loss/deprel_loss: 0.6787, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7620, loss: 0.8500, batch_reg_loss: 0.1164, reg_loss: 0.1158 ||:  66%|######6   | 63/95 [00:44<00:22,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9323, LAS: 0.8740, UEM: 0.5542, LEM: 0.3114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2823, partial_loss/deprel_loss: 0.4911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5659, loss: 0.8528, batch_reg_loss: 0.1165, reg_loss: 0.1158 ||:  69%|######9   | 66/95 [00:46<00:20,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9335, LAS: 0.8752, UEM: 0.5605, LEM: 0.3125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4231, partial_loss/deprel_loss: 0.6362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7102, loss: 0.8413, batch_reg_loss: 0.1166, reg_loss: 0.1158 ||:  74%|#######3  | 70/95 [00:49<00:17,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9339, LAS: 0.8756, UEM: 0.5551, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4018, partial_loss/deprel_loss: 0.5605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6454, loss: 0.8376, batch_reg_loss: 0.1167, reg_loss: 0.1159 ||:  78%|#######7  | 74/95 [00:52<00:14,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9341, LAS: 0.8758, UEM: 0.5480, LEM: 0.2983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6369, partial_loss/deprel_loss: 0.7233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8228, loss: 0.8353, batch_reg_loss: 0.1167, reg_loss: 0.1159 ||:  82%|########2 | 78/95 [00:54<00:11,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9335, LAS: 0.8753, UEM: 0.5534, LEM: 0.3080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1816, partial_loss/deprel_loss: 0.3116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4024, loss: 0.8385, batch_reg_loss: 0.1168, reg_loss: 0.1160 ||:  86%|########6 | 82/95 [00:57<00:08,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9338, LAS: 0.8754, UEM: 0.5523, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3737, partial_loss/deprel_loss: 0.6308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6962, loss: 0.8371, batch_reg_loss: 0.1169, reg_loss: 0.1160 ||:  91%|######### | 86/95 [00:59<00:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7668, UAS: 0.9333, LAS: 0.8749, UEM: 0.5530, LEM: 0.3044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1193, partial_loss/deprel_loss: 1.3323, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6066, loss: 0.8406, batch_reg_loss: 0.1170, reg_loss: 0.1160 ||:  95%|#########4| 90/95 [01:02<00:03,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9335, LAS: 0.8749, UEM: 0.5575, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1158, partial_loss/deprel_loss: 0.3491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4195, loss: 0.8389, batch_reg_loss: 0.1171, reg_loss: 0.1161 ||:  99%|#########8| 94/95 [01:05<00:00,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9332, LAS: 0.8745, UEM: 0.5553, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0379, partial_loss/deprel_loss: 0.9985, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1235, loss: 0.8419, batch_reg_loss: 0.1171, reg_loss: 0.1161 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-06 23:29:02,672 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.116  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - UEM                      |     0.555  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - LEM                      |     0.307  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - EM                       |     0.837  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.038  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - UAS                      |     0.933  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.999  |       N/A\n",
+      "2023-04-06 23:29:02,673 - INFO - combo.training.tensorboard_writer - loss                     |     0.842  |       N/A\n",
+      "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - LAS                      |     0.874  |       N/A\n",
+      "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:29:02,674 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:29:02,675 - INFO - combo.training.trainer - Epoch duration: 0:01:06.282521\n",
+      "2023-04-06 23:29:02,675 - INFO - combo.training.trainer - Estimated training time remaining: 6:51:18\n",
+      "2023-04-06 23:29:02,675 - INFO - allennlp.training.trainer - Epoch 35/399\n",
+      "2023-04-06 23:29:02,675 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:29:02,675 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:29:02,682 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8403, UAS: 0.9328, LAS: 0.8700, UEM: 0.4015, LEM: 0.1409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8949, partial_loss/deprel_loss: 1.0499, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1360, loss: 0.8917, batch_reg_loss: 0.1172, reg_loss: 0.1171 ||:   4%|4         | 4/95 [00:02<00:56,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9388, LAS: 0.8803, UEM: 0.5021, LEM: 0.2380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6407, partial_loss/deprel_loss: 0.8017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8867, loss: 0.8298, batch_reg_loss: 0.1172, reg_loss: 0.1172 ||:   8%|8         | 8/95 [00:04<00:54,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9330, LAS: 0.8742, UEM: 0.4814, LEM: 0.2262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7000, partial_loss/deprel_loss: 0.7975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8953, loss: 0.8565, batch_reg_loss: 0.1173, reg_loss: 0.1172 ||:  13%|#2        | 12/95 [00:08<00:59,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9296, LAS: 0.8717, UEM: 0.4975, LEM: 0.2517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2341, partial_loss/deprel_loss: 0.4173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4980, loss: 0.8744, batch_reg_loss: 0.1174, reg_loss: 0.1172 ||:  16%|#5        | 15/95 [00:10<00:57,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9355, LAS: 0.8785, UEM: 0.5918, LEM: 0.3425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1491, partial_loss/deprel_loss: 0.3454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4236, loss: 0.8180, batch_reg_loss: 0.1175, reg_loss: 0.1173 ||:  19%|#8        | 18/95 [00:13<00:57,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8332, UAS: 0.9327, LAS: 0.8755, UEM: 0.5839, LEM: 0.3368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1837, partial_loss/deprel_loss: 1.0341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1816, loss: 0.8458, batch_reg_loss: 0.1175, reg_loss: 0.1173 ||:  22%|##2       | 21/95 [00:15<00:53,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9330, LAS: 0.8747, UEM: 0.5557, LEM: 0.3085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5207, partial_loss/deprel_loss: 0.6897, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7735, loss: 0.8494, batch_reg_loss: 0.1176, reg_loss: 0.1174 ||:  26%|##6       | 25/95 [00:17<00:47,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8585, UAS: 0.9341, LAS: 0.8764, UEM: 0.5420, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8242, partial_loss/deprel_loss: 0.8496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9622, loss: 0.8364, batch_reg_loss: 0.1177, reg_loss: 0.1174 ||:  31%|###       | 29/95 [00:20<00:43,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9352, LAS: 0.8772, UEM: 0.5393, LEM: 0.2806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3497, partial_loss/deprel_loss: 0.5675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6417, loss: 0.8275, batch_reg_loss: 0.1177, reg_loss: 0.1174 ||:  34%|###3      | 32/95 [00:22<00:44,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8463, UAS: 0.9349, LAS: 0.8771, UEM: 0.5751, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9193, partial_loss/deprel_loss: 0.9739, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0808, loss: 0.8269, batch_reg_loss: 0.1178, reg_loss: 0.1175 ||:  37%|###6      | 35/95 [00:24<00:44,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9314, LAS: 0.8731, UEM: 0.5634, LEM: 0.3265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5175, partial_loss/deprel_loss: 0.6489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7405, loss: 0.8570, batch_reg_loss: 0.1179, reg_loss: 0.1175 ||:  40%|####      | 38/95 [00:27<00:40,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9312, LAS: 0.8725, UEM: 0.5498, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4005, partial_loss/deprel_loss: 0.5868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6675, loss: 0.8583, batch_reg_loss: 0.1179, reg_loss: 0.1175 ||:  44%|####4     | 42/95 [00:29<00:36,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9329, LAS: 0.8745, UEM: 0.5573, LEM: 0.3144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4212, partial_loss/deprel_loss: 0.6137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6932, loss: 0.8438, batch_reg_loss: 0.1180, reg_loss: 0.1176 ||:  47%|####7     | 45/95 [00:31<00:34,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9329, LAS: 0.8745, UEM: 0.5568, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2502, partial_loss/deprel_loss: 0.4501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5282, loss: 0.8414, batch_reg_loss: 0.1181, reg_loss: 0.1176 ||:  52%|#####1    | 49/95 [00:34<00:31,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8264, UAS: 0.9305, LAS: 0.8721, UEM: 0.5382, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3343, partial_loss/deprel_loss: 1.0364, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2141, loss: 0.8611, batch_reg_loss: 0.1182, reg_loss: 0.1176 ||:  56%|#####5    | 53/95 [00:36<00:27,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9303, LAS: 0.8717, UEM: 0.5311, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8531, partial_loss/deprel_loss: 0.8836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9957, loss: 0.8645, batch_reg_loss: 0.1183, reg_loss: 0.1177 ||:  60%|######    | 57/95 [00:38<00:24,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9003, UAS: 0.9305, LAS: 0.8718, UEM: 0.5282, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4067, partial_loss/deprel_loss: 0.5351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6278, loss: 0.8638, batch_reg_loss: 0.1183, reg_loss: 0.1177 ||:  64%|######4   | 61/95 [00:41<00:22,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9321, LAS: 0.8736, UEM: 0.5395, LEM: 0.2949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2952, partial_loss/deprel_loss: 0.5256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5979, loss: 0.8497, batch_reg_loss: 0.1184, reg_loss: 0.1178 ||:  68%|######8   | 65/95 [00:44<00:20,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9329, LAS: 0.8746, UEM: 0.5445, LEM: 0.2967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4054, partial_loss/deprel_loss: 0.5342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6270, loss: 0.8416, batch_reg_loss: 0.1185, reg_loss: 0.1178 ||:  72%|#######1  | 68/95 [00:47<00:19,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9326, LAS: 0.8743, UEM: 0.5391, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6426, partial_loss/deprel_loss: 0.7426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8412, loss: 0.8432, batch_reg_loss: 0.1186, reg_loss: 0.1178 ||:  76%|#######5  | 72/95 [00:49<00:16,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9332, LAS: 0.8750, UEM: 0.5475, LEM: 0.2987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2027, partial_loss/deprel_loss: 0.4440, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.8362, batch_reg_loss: 0.1186, reg_loss: 0.1179 ||:  79%|#######8  | 75/95 [00:52<00:14,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9341, LAS: 0.8760, UEM: 0.5571, LEM: 0.3040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1853, partial_loss/deprel_loss: 0.4359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5045, loss: 0.8281, batch_reg_loss: 0.1187, reg_loss: 0.1179 ||:  82%|########2 | 78/95 [00:54<00:12,  1.37it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9068, UAS: 0.9347, LAS: 0.8766, UEM: 0.5570, LEM: 0.3021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2554, partial_loss/deprel_loss: 0.4840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5570, loss: 0.8217, batch_reg_loss: 0.1188, reg_loss: 0.1179 ||:  85%|########5 | 81/95 [00:56<00:10,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9342, LAS: 0.8760, UEM: 0.5472, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8270, partial_loss/deprel_loss: 0.9002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0044, loss: 0.8251, batch_reg_loss: 0.1188, reg_loss: 0.1180 ||:  89%|########9 | 85/95 [00:59<00:07,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8049, UAS: 0.9342, LAS: 0.8761, UEM: 0.5568, LEM: 0.3079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6723, partial_loss/deprel_loss: 1.2662, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4663, loss: 0.8257, batch_reg_loss: 0.1189, reg_loss: 0.1180 ||:  93%|#########2| 88/95 [01:01<00:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9342, LAS: 0.8763, UEM: 0.5618, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3461, partial_loss/deprel_loss: 0.4791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5714, loss: 0.8216, batch_reg_loss: 0.1189, reg_loss: 0.1180 ||:  96%|#########5| 91/95 [01:03<00:02,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9329, LAS: 0.8749, UEM: 0.5539, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6375, partial_loss/deprel_loss: 0.6770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7881, loss: 0.8337, batch_reg_loss: 0.1190, reg_loss: 0.1181 ||: 100%|##########| 95/95 [01:06<00:00,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9329, LAS: 0.8749, UEM: 0.5539, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6375, partial_loss/deprel_loss: 0.6770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7881, loss: 0.8337, batch_reg_loss: 0.1190, reg_loss: 0.1181 ||: 100%|##########| 95/95 [01:06<00:00,  1.44it/s]\n",
+      "2023-04-06 23:30:08,851 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9588, LAS: 0.9043, UEM: 0.7300, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2290, partial_loss/deprel_loss: 22.2542, partial_loss/cycle_loss: 0.0000, batch_loss: 17.8492, loss: 24.0080, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:03<00:08,  1.06s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9461, LAS: 0.8875, UEM: 0.6354, LEM: 0.3292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3987, partial_loss/deprel_loss: 56.9363, partial_loss/cycle_loss: 0.0000, batch_loss: 45.8288, loss: 27.9184, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  55%|#####4    | 6/11 [00:06<00:05,  1.07s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9473, LAS: 0.8914, UEM: 0.6242, LEM: 0.3156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3161, partial_loss/deprel_loss: 27.6688, partial_loss/cycle_loss: 0.0000, batch_loss: 22.1982, loss: 25.7038, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  82%|########1 | 9/11 [00:09<00:02,  1.02s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9482, LAS: 0.8943, UEM: 0.6692, LEM: 0.3951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0665, partial_loss/deprel_loss: 47.8072, partial_loss/cycle_loss: 0.0000, batch_loss: 38.4590, loss: 25.9505, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:11<00:00,  1.01s/it]\n",
+      "2023-04-06 23:30:19,988 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.118  |     0.000\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - UEM                      |     0.554  |     0.669\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - LEM                      |     0.307  |     0.395\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - EM                       |     0.880  |     0.878\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.637  |     1.067\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - UAS                      |     0.933  |     0.948\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.677  |    47.807\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - loss                     |     0.834  |    25.951\n",
+      "2023-04-06 23:30:19,989 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - LAS                      |     0.875  |     0.894\n",
+      "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:30:19,990 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:30:19,991 - INFO - combo.training.trainer - Epoch duration: 0:01:17.315801\n",
+      "2023-04-06 23:30:19,991 - INFO - combo.training.trainer - Estimated training time remaining: 6:51:49\n",
+      "2023-04-06 23:30:19,991 - INFO - allennlp.training.trainer - Epoch 36/399\n",
+      "2023-04-06 23:30:19,991 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:30:19,991 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:30:19,998 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9477, LAS: 0.8948, UEM: 0.7414, LEM: 0.5057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1763, partial_loss/deprel_loss: 0.3357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4228, loss: 0.6724, batch_reg_loss: 0.1191, reg_loss: 0.1190 ||:   3%|3         | 3/95 [00:02<01:18,  1.17it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9447, LAS: 0.8907, UEM: 0.7507, LEM: 0.5066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1926, partial_loss/deprel_loss: 0.4058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4823, loss: 0.7071, batch_reg_loss: 0.1191, reg_loss: 0.1191 ||:   6%|6         | 6/95 [00:04<01:14,  1.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8546, UAS: 0.9437, LAS: 0.8877, UEM: 0.6831, LEM: 0.4276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8091, partial_loss/deprel_loss: 0.8481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9595, loss: 0.7308, batch_reg_loss: 0.1192, reg_loss: 0.1191 ||:   9%|9         | 9/95 [00:07<01:08,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9433, LAS: 0.8878, UEM: 0.6720, LEM: 0.4069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2829, partial_loss/deprel_loss: 0.4594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.7337, batch_reg_loss: 0.1193, reg_loss: 0.1191 ||:  14%|#3        | 13/95 [00:09<01:01,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8571, UAS: 0.9337, LAS: 0.8770, UEM: 0.6113, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9070, partial_loss/deprel_loss: 0.9308, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0454, loss: 0.8210, batch_reg_loss: 0.1194, reg_loss: 0.1192 ||:  18%|#7        | 17/95 [00:12<00:55,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9360, LAS: 0.8786, UEM: 0.6085, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6687, partial_loss/deprel_loss: 0.8803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9574, loss: 0.8055, batch_reg_loss: 0.1194, reg_loss: 0.1192 ||:  22%|##2       | 21/95 [00:14<00:50,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9339, LAS: 0.8761, UEM: 0.5774, LEM: 0.3296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4460, partial_loss/deprel_loss: 0.5838, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6758, loss: 0.8180, batch_reg_loss: 0.1195, reg_loss: 0.1193 ||:  26%|##6       | 25/95 [00:16<00:45,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9365, LAS: 0.8790, UEM: 0.5851, LEM: 0.3262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3892, partial_loss/deprel_loss: 0.5473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6353, loss: 0.7989, batch_reg_loss: 0.1196, reg_loss: 0.1193 ||:  31%|###       | 29/95 [00:19<00:41,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8875, UAS: 0.9373, LAS: 0.8797, UEM: 0.5731, LEM: 0.3118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4843, partial_loss/deprel_loss: 0.6256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7170, loss: 0.7960, batch_reg_loss: 0.1197, reg_loss: 0.1194 ||:  35%|###4      | 33/95 [00:21<00:37,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9384, LAS: 0.8806, UEM: 0.5733, LEM: 0.3105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1741, partial_loss/deprel_loss: 0.3951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4707, loss: 0.7905, batch_reg_loss: 0.1198, reg_loss: 0.1194 ||:  39%|###8      | 37/95 [00:24<00:36,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9369, LAS: 0.8790, UEM: 0.5588, LEM: 0.2999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5788, partial_loss/deprel_loss: 0.6406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7481, loss: 0.8037, batch_reg_loss: 0.1199, reg_loss: 0.1194 ||:  43%|####3     | 41/95 [00:26<00:33,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9392, LAS: 0.8820, UEM: 0.5883, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2532, partial_loss/deprel_loss: 0.4424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5245, loss: 0.7805, batch_reg_loss: 0.1199, reg_loss: 0.1195 ||:  47%|####7     | 45/95 [00:29<00:33,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8351, UAS: 0.9385, LAS: 0.8812, UEM: 0.5812, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0758, partial_loss/deprel_loss: 1.0011, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1360, loss: 0.7848, batch_reg_loss: 0.1200, reg_loss: 0.1195 ||:  52%|#####1    | 49/95 [00:32<00:30,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9356, LAS: 0.8781, UEM: 0.5654, LEM: 0.3101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5366, partial_loss/deprel_loss: 0.6590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7546, loss: 0.8110, batch_reg_loss: 0.1201, reg_loss: 0.1196 ||:  56%|#####5    | 53/95 [00:34<00:26,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8106, UAS: 0.9349, LAS: 0.8773, UEM: 0.5602, LEM: 0.3040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5064, partial_loss/deprel_loss: 1.1534, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3441, loss: 0.8169, batch_reg_loss: 0.1202, reg_loss: 0.1196 ||:  60%|######    | 57/95 [00:37<00:24,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8379, UAS: 0.9353, LAS: 0.8777, UEM: 0.5632, LEM: 0.3045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0102, partial_loss/deprel_loss: 1.0672, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1761, loss: 0.8153, batch_reg_loss: 0.1202, reg_loss: 0.1196 ||:  64%|######4   | 61/95 [00:39<00:21,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9368, LAS: 0.8799, UEM: 0.5933, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3850, partial_loss/deprel_loss: 0.5073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6032, loss: 0.7989, batch_reg_loss: 0.1203, reg_loss: 0.1197 ||:  68%|######8   | 65/95 [00:43<00:20,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9374, LAS: 0.8805, UEM: 0.5959, LEM: 0.3443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2705, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5253, loss: 0.7937, batch_reg_loss: 0.1204, reg_loss: 0.1197 ||:  72%|#######1  | 68/95 [00:45<00:18,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.9362, LAS: 0.8789, UEM: 0.5825, LEM: 0.3345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7992, partial_loss/deprel_loss: 0.8101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9284, loss: 0.8062, batch_reg_loss: 0.1205, reg_loss: 0.1198 ||:  76%|#######5  | 72/95 [00:47<00:15,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9347, LAS: 0.8771, UEM: 0.5741, LEM: 0.3277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4389, partial_loss/deprel_loss: 0.6778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7506, loss: 0.8209, batch_reg_loss: 0.1206, reg_loss: 0.1198 ||:  80%|########  | 76/95 [00:50<00:12,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9343, LAS: 0.8766, UEM: 0.5661, LEM: 0.3215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5118, partial_loss/deprel_loss: 0.6204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7193, loss: 0.8243, batch_reg_loss: 0.1206, reg_loss: 0.1198 ||:  84%|########4 | 80/95 [00:52<00:09,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9334, LAS: 0.8756, UEM: 0.5653, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4969, partial_loss/deprel_loss: 0.6062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7051, loss: 0.8302, batch_reg_loss: 0.1207, reg_loss: 0.1199 ||:  88%|########8 | 84/95 [00:55<00:07,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9330, LAS: 0.8751, UEM: 0.5612, LEM: 0.3176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5179, partial_loss/deprel_loss: 0.6615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7536, loss: 0.8346, batch_reg_loss: 0.1208, reg_loss: 0.1199 ||:  92%|#########1| 87/95 [00:57<00:05,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9330, LAS: 0.8751, UEM: 0.5596, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2933, partial_loss/deprel_loss: 0.4630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5499, loss: 0.8357, batch_reg_loss: 0.1209, reg_loss: 0.1199 ||:  95%|#########4| 90/95 [00:59<00:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8294, UAS: 0.9328, LAS: 0.8748, UEM: 0.5558, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1469, partial_loss/deprel_loss: 1.0104, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1587, loss: 0.8370, batch_reg_loss: 0.1210, reg_loss: 0.1200 ||:  99%|#########8| 94/95 [01:02<00:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9329, LAS: 0.8749, UEM: 0.5544, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5993, partial_loss/deprel_loss: 0.7079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8071, loss: 0.8367, batch_reg_loss: 0.1210, reg_loss: 0.1200 ||: 100%|##########| 95/95 [01:02<00:00,  1.51it/s]\n",
+      "2023-04-06 23:31:22,906 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.120  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - UEM                      |     0.554  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - LEM                      |     0.310  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - EM                       |     0.884  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.599  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - UAS                      |     0.933  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.708  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - loss                     |     0.837  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:31:22,907 - INFO - combo.training.tensorboard_writer - LAS                      |     0.875  |       N/A\n",
+      "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:31:22,908 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:31:22,908 - INFO - combo.training.trainer - Epoch duration: 0:01:02.917721\n",
+      "2023-04-06 23:31:22,909 - INFO - combo.training.trainer - Estimated training time remaining: 6:49:52\n",
+      "2023-04-06 23:31:22,909 - INFO - allennlp.training.trainer - Epoch 37/399\n",
+      "2023-04-06 23:31:22,909 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:31:22,909 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:31:22,916 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8784, UAS: 0.9514, LAS: 0.8954, UEM: 0.5949, LEM: 0.2786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6434, partial_loss/deprel_loss: 0.7854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8781, loss: 0.6990, batch_reg_loss: 0.1211, reg_loss: 0.1210 ||:   4%|4         | 4/95 [00:02<00:54,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9370, LAS: 0.8811, UEM: 0.5511, LEM: 0.2706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4832, partial_loss/deprel_loss: 0.6702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7539, loss: 0.8023, batch_reg_loss: 0.1211, reg_loss: 0.1211 ||:   8%|8         | 8/95 [00:04<00:52,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9313, LAS: 0.8750, UEM: 0.4997, LEM: 0.2391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6666, partial_loss/deprel_loss: 0.7253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8347, loss: 0.8502, batch_reg_loss: 0.1212, reg_loss: 0.1211 ||:  12%|#1        | 11/95 [00:06<00:53,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9320, LAS: 0.8754, UEM: 0.4993, LEM: 0.2396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7533, partial_loss/deprel_loss: 0.7773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8938, loss: 0.8417, batch_reg_loss: 0.1213, reg_loss: 0.1211 ||:  15%|#4        | 14/95 [00:09<00:54,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9336, LAS: 0.8763, UEM: 0.4745, LEM: 0.2181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4635, partial_loss/deprel_loss: 0.5870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6837, loss: 0.8257, batch_reg_loss: 0.1214, reg_loss: 0.1212 ||:  19%|#8        | 18/95 [00:11<00:50,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9368, LAS: 0.8794, UEM: 0.5117, LEM: 0.2452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5865, partial_loss/deprel_loss: 0.7784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8615, loss: 0.8011, batch_reg_loss: 0.1215, reg_loss: 0.1212 ||:  23%|##3       | 22/95 [00:14<00:47,  1.53it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9362, LAS: 0.8787, UEM: 0.4922, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8021, partial_loss/deprel_loss: 0.8052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9261, loss: 0.8076, batch_reg_loss: 0.1215, reg_loss: 0.1213 ||:  27%|##7       | 26/95 [00:16<00:43,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9360, LAS: 0.8787, UEM: 0.4889, LEM: 0.2287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3007, partial_loss/deprel_loss: 0.5390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6129, loss: 0.8082, batch_reg_loss: 0.1216, reg_loss: 0.1213 ||:  32%|###1      | 30/95 [00:19<00:43,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9366, LAS: 0.8795, UEM: 0.5116, LEM: 0.2537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1484, partial_loss/deprel_loss: 0.3678, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4456, loss: 0.8037, batch_reg_loss: 0.1217, reg_loss: 0.1213 ||:  35%|###4      | 33/95 [00:21<00:42,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8447, UAS: 0.9365, LAS: 0.8796, UEM: 0.5081, LEM: 0.2506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1201, partial_loss/deprel_loss: 0.9817, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1311, loss: 0.8029, batch_reg_loss: 0.1217, reg_loss: 0.1214 ||:  38%|###7      | 36/95 [00:24<00:42,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9357, LAS: 0.8786, UEM: 0.5266, LEM: 0.2659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2559, partial_loss/deprel_loss: 0.4295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5165, loss: 0.8096, batch_reg_loss: 0.1218, reg_loss: 0.1214 ||:  41%|####1     | 39/95 [00:26<00:40,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8265, UAS: 0.9358, LAS: 0.8790, UEM: 0.5437, LEM: 0.2860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2482, partial_loss/deprel_loss: 1.0411, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2044, loss: 0.8043, batch_reg_loss: 0.1218, reg_loss: 0.1214 ||:  44%|####4     | 42/95 [00:29<00:40,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7986, UAS: 0.9314, LAS: 0.8745, UEM: 0.5338, LEM: 0.2795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8628, partial_loss/deprel_loss: 1.1907, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4471, loss: 0.8394, batch_reg_loss: 0.1219, reg_loss: 0.1215 ||:  48%|####8     | 46/95 [00:31<00:36,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9324, LAS: 0.8757, UEM: 0.5487, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1373, partial_loss/deprel_loss: 0.2893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3809, loss: 0.8302, batch_reg_loss: 0.1220, reg_loss: 0.1215 ||:  52%|#####1    | 49/95 [00:33<00:33,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9332, LAS: 0.8763, UEM: 0.5467, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2825, partial_loss/deprel_loss: 0.4777, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5607, loss: 0.8246, batch_reg_loss: 0.1221, reg_loss: 0.1215 ||:  55%|#####4    | 52/95 [00:35<00:30,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9329, LAS: 0.8760, UEM: 0.5492, LEM: 0.2966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2645, partial_loss/deprel_loss: 0.5083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5817, loss: 0.8270, batch_reg_loss: 0.1221, reg_loss: 0.1216 ||:  58%|#####7    | 55/95 [00:38<00:28,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8588, UAS: 0.9322, LAS: 0.8753, UEM: 0.5408, LEM: 0.2908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8819, partial_loss/deprel_loss: 0.8136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9494, loss: 0.8340, batch_reg_loss: 0.1222, reg_loss: 0.1216 ||:  61%|######1   | 58/95 [00:40<00:26,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8506, UAS: 0.9315, LAS: 0.8742, UEM: 0.5311, LEM: 0.2835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0343, partial_loss/deprel_loss: 0.8963, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0462, loss: 0.8424, batch_reg_loss: 0.1222, reg_loss: 0.1216 ||:  64%|######4   | 61/95 [00:42<00:24,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9128, UAS: 0.9313, LAS: 0.8739, UEM: 0.5281, LEM: 0.2806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3109, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5326, loss: 0.8451, batch_reg_loss: 0.1223, reg_loss: 0.1217 ||:  68%|######8   | 65/95 [00:44<00:20,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9308, LAS: 0.8734, UEM: 0.5217, LEM: 0.2748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4480, partial_loss/deprel_loss: 0.6569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7375, loss: 0.8507, batch_reg_loss: 0.1224, reg_loss: 0.1217 ||:  73%|#######2  | 69/95 [00:47<00:17,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9316, LAS: 0.8742, UEM: 0.5276, LEM: 0.2791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5359, partial_loss/deprel_loss: 0.6530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7521, loss: 0.8441, batch_reg_loss: 0.1225, reg_loss: 0.1218 ||:  77%|#######6  | 73/95 [00:50<00:15,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8364, UAS: 0.9317, LAS: 0.8741, UEM: 0.5278, LEM: 0.2776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1349, partial_loss/deprel_loss: 1.0402, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1817, loss: 0.8445, batch_reg_loss: 0.1226, reg_loss: 0.1218 ||:  80%|########  | 76/95 [00:52<00:14,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8504, UAS: 0.9314, LAS: 0.8737, UEM: 0.5233, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0308, partial_loss/deprel_loss: 0.8860, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0376, loss: 0.8476, batch_reg_loss: 0.1226, reg_loss: 0.1218 ||:  83%|########3 | 79/95 [00:55<00:11,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9320, LAS: 0.8747, UEM: 0.5446, LEM: 0.3028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2678, partial_loss/deprel_loss: 0.4654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5486, loss: 0.8411, batch_reg_loss: 0.1227, reg_loss: 0.1218 ||:  86%|########6 | 82/95 [00:57<00:10,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.9321, LAS: 0.8748, UEM: 0.5496, LEM: 0.3095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9542, partial_loss/deprel_loss: 1.0536, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1565, loss: 0.8409, batch_reg_loss: 0.1228, reg_loss: 0.1219 ||:  89%|########9 | 85/95 [01:00<00:07,  1.29it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9322, LAS: 0.8749, UEM: 0.5446, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7975, partial_loss/deprel_loss: 0.9283, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0250, loss: 0.8398, batch_reg_loss: 0.1228, reg_loss: 0.1219 ||:  94%|#########3| 89/95 [01:02<00:04,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9325, LAS: 0.8750, UEM: 0.5452, LEM: 0.3023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5842, partial_loss/deprel_loss: 0.7836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8666, loss: 0.8388, batch_reg_loss: 0.1229, reg_loss: 0.1219 ||:  97%|#########6| 92/95 [01:04<00:02,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9333, LAS: 0.8758, UEM: 0.5520, LEM: 0.3065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6730, partial_loss/deprel_loss: 0.7886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8884, loss: 0.8336, batch_reg_loss: 0.1230, reg_loss: 0.1220 ||: 100%|##########| 95/95 [01:06<00:00,  1.42it/s]\n",
+      "2023-04-06 23:32:29,689 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.122  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - UEM                      |     0.552  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - LEM                      |     0.306  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - EM                       |     0.875  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.673  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - UAS                      |     0.933  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.789  |       N/A\n",
+      "2023-04-06 23:32:29,690 - INFO - combo.training.tensorboard_writer - loss                     |     0.834  |       N/A\n",
+      "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - LAS                      |     0.876  |       N/A\n",
+      "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:32:29,691 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:32:29,692 - INFO - combo.training.trainer - Epoch duration: 0:01:06.782898\n",
+      "2023-04-06 23:32:29,692 - INFO - combo.training.trainer - Estimated training time remaining: 6:48:35\n",
+      "2023-04-06 23:32:29,692 - INFO - allennlp.training.trainer - Epoch 38/399\n",
+      "2023-04-06 23:32:29,692 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:32:29,692 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:32:29,699 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9468, LAS: 0.8878, UEM: 0.5179, LEM: 0.2321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3875, partial_loss/deprel_loss: 0.5396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6322, loss: 0.7048, batch_reg_loss: 0.1230, reg_loss: 0.1230 ||:   3%|3         | 3/95 [00:02<01:04,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9404, LAS: 0.8853, UEM: 0.5849, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2919, partial_loss/deprel_loss: 0.4636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5523, loss: 0.7458, batch_reg_loss: 0.1231, reg_loss: 0.1230 ||:   6%|6         | 6/95 [00:04<01:01,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9322, LAS: 0.8764, UEM: 0.5648, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8550, partial_loss/deprel_loss: 0.9004, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0144, loss: 0.8174, batch_reg_loss: 0.1231, reg_loss: 0.1231 ||:  11%|#         | 10/95 [00:06<00:57,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8336, UAS: 0.9306, LAS: 0.8744, UEM: 0.5312, LEM: 0.2768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0999, partial_loss/deprel_loss: 0.9766, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1245, loss: 0.8379, batch_reg_loss: 0.1232, reg_loss: 0.1231 ||:  15%|#4        | 14/95 [00:09<00:54,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9303, LAS: 0.8744, UEM: 0.5064, LEM: 0.2534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5468, partial_loss/deprel_loss: 0.6683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7673, loss: 0.8399, batch_reg_loss: 0.1233, reg_loss: 0.1231 ||:  19%|#8        | 18/95 [00:11<00:51,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9305, LAS: 0.8738, UEM: 0.5088, LEM: 0.2519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2656, partial_loss/deprel_loss: 0.4825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5625, loss: 0.8459, batch_reg_loss: 0.1234, reg_loss: 0.1232 ||:  22%|##2       | 21/95 [00:14<00:51,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8021, UAS: 0.9296, LAS: 0.8724, UEM: 0.4969, LEM: 0.2394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5105, partial_loss/deprel_loss: 1.2375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4156, loss: 0.8596, batch_reg_loss: 0.1234, reg_loss: 0.1232 ||:  26%|##6       | 25/95 [00:16<00:46,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9308, LAS: 0.8741, UEM: 0.5015, LEM: 0.2442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4046, partial_loss/deprel_loss: 0.6064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6896, loss: 0.8492, batch_reg_loss: 0.1235, reg_loss: 0.1232 ||:  29%|##9       | 28/95 [00:18<00:45,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8883, UAS: 0.9338, LAS: 0.8778, UEM: 0.5633, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5251, partial_loss/deprel_loss: 0.6847, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7764, loss: 0.8249, batch_reg_loss: 0.1236, reg_loss: 0.1233 ||:  33%|###2      | 31/95 [00:21<00:45,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8463, UAS: 0.9338, LAS: 0.8776, UEM: 0.5580, LEM: 0.3140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9901, partial_loss/deprel_loss: 0.9016, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0430, loss: 0.8267, batch_reg_loss: 0.1236, reg_loss: 0.1233 ||:  36%|###5      | 34/95 [00:23<00:42,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9350, LAS: 0.8789, UEM: 0.5612, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4870, partial_loss/deprel_loss: 0.5764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6822, loss: 0.8136, batch_reg_loss: 0.1237, reg_loss: 0.1233 ||:  39%|###8      | 37/95 [00:25<00:40,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9359, LAS: 0.8801, UEM: 0.5639, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5278, partial_loss/deprel_loss: 0.6427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7435, loss: 0.8035, batch_reg_loss: 0.1237, reg_loss: 0.1234 ||:  42%|####2     | 40/95 [00:27<00:38,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9368, LAS: 0.8812, UEM: 0.5744, LEM: 0.3240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1437, partial_loss/deprel_loss: 0.3322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4183, loss: 0.7933, batch_reg_loss: 0.1238, reg_loss: 0.1234 ||:  45%|####5     | 43/95 [00:29<00:37,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9356, LAS: 0.8795, UEM: 0.5579, LEM: 0.3102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4626, partial_loss/deprel_loss: 0.6600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7444, loss: 0.8057, batch_reg_loss: 0.1239, reg_loss: 0.1234 ||:  49%|####9     | 47/95 [00:32<00:32,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8432, UAS: 0.9358, LAS: 0.8798, UEM: 0.5603, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9331, partial_loss/deprel_loss: 0.8576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9967, loss: 0.8002, batch_reg_loss: 0.1239, reg_loss: 0.1235 ||:  53%|#####2    | 50/95 [00:34<00:31,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8193, UAS: 0.9354, LAS: 0.8789, UEM: 0.5552, LEM: 0.3087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3234, partial_loss/deprel_loss: 1.0071, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1944, loss: 0.8053, batch_reg_loss: 0.1240, reg_loss: 0.1235 ||:  57%|#####6    | 54/95 [00:36<00:27,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9363, LAS: 0.8802, UEM: 0.5559, LEM: 0.3079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2073, partial_loss/deprel_loss: 0.5454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6018, loss: 0.7968, batch_reg_loss: 0.1241, reg_loss: 0.1235 ||:  61%|######1   | 58/95 [00:39<00:23,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9352, LAS: 0.8788, UEM: 0.5565, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5459, partial_loss/deprel_loss: 0.7448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8291, loss: 0.8069, batch_reg_loss: 0.1241, reg_loss: 0.1236 ||:  65%|######5   | 62/95 [00:41<00:21,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9360, LAS: 0.8799, UEM: 0.5602, LEM: 0.3110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3582, partial_loss/deprel_loss: 0.5754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6562, loss: 0.7988, batch_reg_loss: 0.1242, reg_loss: 0.1236 ||:  69%|######9   | 66/95 [00:44<00:19,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9357, LAS: 0.8793, UEM: 0.5555, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5896, partial_loss/deprel_loss: 0.7611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8511, loss: 0.8060, batch_reg_loss: 0.1243, reg_loss: 0.1236 ||:  74%|#######3  | 70/95 [00:47<00:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8668, UAS: 0.9362, LAS: 0.8798, UEM: 0.5560, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7461, partial_loss/deprel_loss: 0.7575, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8796, loss: 0.8015, batch_reg_loss: 0.1243, reg_loss: 0.1237 ||:  77%|#######6  | 73/95 [00:50<00:15,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8308, UAS: 0.9359, LAS: 0.8796, UEM: 0.5522, LEM: 0.3017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1170, partial_loss/deprel_loss: 1.0188, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1628, loss: 0.8031, batch_reg_loss: 0.1244, reg_loss: 0.1237 ||:  80%|########  | 76/95 [00:52<00:13,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9371, LAS: 0.8808, UEM: 0.5712, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2030, partial_loss/deprel_loss: 0.4119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4946, loss: 0.7918, batch_reg_loss: 0.1245, reg_loss: 0.1237 ||:  83%|########3 | 79/95 [00:54<00:11,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7651, UAS: 0.9347, LAS: 0.8780, UEM: 0.5644, LEM: 0.3149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1664, partial_loss/deprel_loss: 1.4685, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7326, loss: 0.8152, batch_reg_loss: 0.1245, reg_loss: 0.1238 ||:  86%|########6 | 82/95 [00:56<00:09,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9344, LAS: 0.8776, UEM: 0.5591, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3251, partial_loss/deprel_loss: 0.5764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.8192, batch_reg_loss: 0.1246, reg_loss: 0.1238 ||:  91%|######### | 86/95 [00:59<00:06,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8431, UAS: 0.9337, LAS: 0.8768, UEM: 0.5541, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9655, partial_loss/deprel_loss: 0.9398, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0696, loss: 0.8243, batch_reg_loss: 0.1247, reg_loss: 0.1238 ||:  95%|#########4| 90/95 [01:02<00:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.9334, LAS: 0.8764, UEM: 0.5476, LEM: 0.3011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9685, partial_loss/deprel_loss: 0.8837, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0254, loss: 0.8279, batch_reg_loss: 0.1247, reg_loss: 0.1239 ||:  98%|#########7| 93/95 [01:04<00:01,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9338, LAS: 0.8769, UEM: 0.5566, LEM: 0.3123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1388, partial_loss/deprel_loss: 0.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3800, loss: 0.8233, batch_reg_loss: 0.1248, reg_loss: 0.1239 ||: 100%|##########| 95/95 [01:05<00:00,  1.44it/s]\n",
+      "2023-04-06 23:33:35,455 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:33:35,455 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:33:35,455 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.124  |       N/A\n",
+      "2023-04-06 23:33:35,455 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - UEM                      |     0.557  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - LEM                      |     0.312  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - EM                       |     0.932  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.139  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - UAS                      |     0.934  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.284  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - loss                     |     0.823  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - LAS                      |     0.877  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:33:35,456 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:33:35,457 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:33:35,457 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:33:35,457 - INFO - combo.training.trainer - Epoch duration: 0:01:05.765487\n",
+      "2023-04-06 23:33:35,457 - INFO - combo.training.trainer - Estimated training time remaining: 6:47:10\n",
+      "2023-04-06 23:33:35,458 - INFO - allennlp.training.trainer - Epoch 39/399\n",
+      "2023-04-06 23:33:35,458 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:33:35,458 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:33:35,465 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7854, UAS: 0.9013, LAS: 0.8406, UEM: 0.2256, LEM: 0.0677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9358, partial_loss/deprel_loss: 1.3153, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5643, loss: 1.1230, batch_reg_loss: 0.1249, reg_loss: 0.1248 ||:   3%|3         | 3/95 [00:02<01:07,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9146, LAS: 0.8558, UEM: 0.3082, LEM: 0.0959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4825, partial_loss/deprel_loss: 0.6405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7338, loss: 1.0103, batch_reg_loss: 0.1249, reg_loss: 0.1249 ||:   6%|6         | 6/95 [00:04<01:04,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9284, LAS: 0.8724, UEM: 0.5318, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2490, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4835, loss: 0.8735, batch_reg_loss: 0.1250, reg_loss: 0.1249 ||:  11%|#         | 10/95 [00:07<01:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9343, LAS: 0.8784, UEM: 0.5593, LEM: 0.2963, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5965, partial_loss/deprel_loss: 0.7453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8407, loss: 0.8243, batch_reg_loss: 0.1251, reg_loss: 0.1249 ||:  14%|#3        | 13/95 [00:09<00:58,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9323, LAS: 0.8762, UEM: 0.5283, LEM: 0.2729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5030, partial_loss/deprel_loss: 0.5858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6944, loss: 0.8411, batch_reg_loss: 0.1251, reg_loss: 0.1250 ||:  17%|#6        | 16/95 [00:11<00:56,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9370, LAS: 0.8817, UEM: 0.6207, LEM: 0.3765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1209, partial_loss/deprel_loss: 0.2790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3726, loss: 0.7979, batch_reg_loss: 0.1252, reg_loss: 0.1250 ||:  20%|##        | 19/95 [00:13<00:56,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9374, LAS: 0.8823, UEM: 0.6201, LEM: 0.3755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0154, partial_loss/deprel_loss: 0.9240, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0676, loss: 0.7916, batch_reg_loss: 0.1253, reg_loss: 0.1250 ||:  23%|##3       | 22/95 [00:16<00:55,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9358, LAS: 0.8805, UEM: 0.6121, LEM: 0.3726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1837, partial_loss/deprel_loss: 0.3674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4560, loss: 0.8050, batch_reg_loss: 0.1253, reg_loss: 0.1251 ||:  27%|##7       | 26/95 [00:18<00:50,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9380, LAS: 0.8832, UEM: 0.6298, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3012, partial_loss/deprel_loss: 0.3943, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5011, loss: 0.7793, batch_reg_loss: 0.1254, reg_loss: 0.1251 ||:  31%|###       | 29/95 [00:21<00:54,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9364, LAS: 0.8817, UEM: 0.6136, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4184, partial_loss/deprel_loss: 0.4977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6073, loss: 0.7870, batch_reg_loss: 0.1254, reg_loss: 0.1251 ||:  34%|###3      | 32/95 [00:23<00:49,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9369, LAS: 0.8820, UEM: 0.6008, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2908, partial_loss/deprel_loss: 0.5142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5950, loss: 0.7869, batch_reg_loss: 0.1255, reg_loss: 0.1252 ||:  38%|###7      | 36/95 [00:26<00:44,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8875, UAS: 0.9359, LAS: 0.8805, UEM: 0.5898, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4490, partial_loss/deprel_loss: 0.5749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6753, loss: 0.7989, batch_reg_loss: 0.1256, reg_loss: 0.1252 ||:  41%|####1     | 39/95 [00:28<00:40,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9365, LAS: 0.8817, UEM: 0.6143, LEM: 0.3838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5383, partial_loss/deprel_loss: 0.6646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7650, loss: 0.7930, batch_reg_loss: 0.1256, reg_loss: 0.1252 ||:  44%|####4     | 42/95 [00:31<00:41,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9361, LAS: 0.8814, UEM: 0.6079, LEM: 0.3749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3776, partial_loss/deprel_loss: 0.5837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6681, loss: 0.7952, batch_reg_loss: 0.1257, reg_loss: 0.1253 ||:  47%|####7     | 45/95 [00:33<00:37,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8932, UAS: 0.9357, LAS: 0.8805, UEM: 0.5984, LEM: 0.3630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3667, partial_loss/deprel_loss: 0.5887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6700, loss: 0.8030, batch_reg_loss: 0.1258, reg_loss: 0.1253 ||:  52%|#####1    | 49/95 [00:36<00:33,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9373, LAS: 0.8821, UEM: 0.6066, LEM: 0.3657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2052, partial_loss/deprel_loss: 0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4849, loss: 0.7901, batch_reg_loss: 0.1259, reg_loss: 0.1253 ||:  56%|#####5    | 53/95 [00:38<00:29,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9367, LAS: 0.8813, UEM: 0.5989, LEM: 0.3579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3410, partial_loss/deprel_loss: 0.5433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6287, loss: 0.7944, batch_reg_loss: 0.1259, reg_loss: 0.1254 ||:  59%|#####8    | 56/95 [00:40<00:27,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8728, UAS: 0.9367, LAS: 0.8811, UEM: 0.5948, LEM: 0.3536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6581, partial_loss/deprel_loss: 0.7599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8655, loss: 0.7959, batch_reg_loss: 0.1260, reg_loss: 0.1254 ||:  62%|######2   | 59/95 [00:42<00:25,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9377, LAS: 0.8821, UEM: 0.5973, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2486, partial_loss/deprel_loss: 0.4472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5335, loss: 0.7878, batch_reg_loss: 0.1260, reg_loss: 0.1254 ||:  65%|######5   | 62/95 [00:45<00:23,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8567, UAS: 0.9366, LAS: 0.8807, UEM: 0.5859, LEM: 0.3439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7358, partial_loss/deprel_loss: 0.8422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9470, loss: 0.7992, batch_reg_loss: 0.1261, reg_loss: 0.1255 ||:  68%|######8   | 65/95 [00:47<00:20,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9368, LAS: 0.8807, UEM: 0.5874, LEM: 0.3408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2687, partial_loss/deprel_loss: 0.4925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5739, loss: 0.7989, batch_reg_loss: 0.1262, reg_loss: 0.1255 ||:  73%|#######2  | 69/95 [00:49<00:17,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7954, UAS: 0.9347, LAS: 0.8782, UEM: 0.5760, LEM: 0.3330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8442, partial_loss/deprel_loss: 1.2007, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4556, loss: 0.8182, batch_reg_loss: 0.1262, reg_loss: 0.1255 ||:  77%|#######6  | 73/95 [00:52<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9348, LAS: 0.8782, UEM: 0.5740, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1669, partial_loss/deprel_loss: 1.1540, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2829, loss: 0.8196, batch_reg_loss: 0.1263, reg_loss: 0.1256 ||:  80%|########  | 76/95 [00:54<00:12,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8684, UAS: 0.9344, LAS: 0.8778, UEM: 0.5651, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7605, partial_loss/deprel_loss: 0.7363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8675, loss: 0.8245, batch_reg_loss: 0.1264, reg_loss: 0.1256 ||:  84%|########4 | 80/95 [00:56<00:09,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9346, LAS: 0.8778, UEM: 0.5585, LEM: 0.3154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5044, partial_loss/deprel_loss: 0.6359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7361, loss: 0.8251, batch_reg_loss: 0.1265, reg_loss: 0.1257 ||:  88%|########8 | 84/95 [00:59<00:07,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9349, LAS: 0.8780, UEM: 0.5571, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7289, partial_loss/deprel_loss: 0.8303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9366, loss: 0.8227, batch_reg_loss: 0.1265, reg_loss: 0.1257 ||:  92%|#########1| 87/95 [01:01<00:05,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8932, UAS: 0.9353, LAS: 0.8782, UEM: 0.5545, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4038, partial_loss/deprel_loss: 0.5717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6647, loss: 0.8211, batch_reg_loss: 0.1266, reg_loss: 0.1257 ||:  96%|#########5| 91/95 [01:04<00:02,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9357, LAS: 0.8788, UEM: 0.5600, LEM: 0.3125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3942, partial_loss/deprel_loss: 0.5844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6730, loss: 0.8153, batch_reg_loss: 0.1267, reg_loss: 0.1257 ||:  99%|#########8| 94/95 [01:06<00:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7955, UAS: 0.9349, LAS: 0.8780, UEM: 0.5581, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7372, partial_loss/deprel_loss: 1.3056, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5186, loss: 0.8227, batch_reg_loss: 0.1267, reg_loss: 0.1258 ||: 100%|##########| 95/95 [01:07<00:00,  1.41it/s]\n",
+      "2023-04-06 23:34:42,924 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:34:42,924 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:34:42,924 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.126  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - UEM                      |     0.558  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - LEM                      |     0.311  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - EM                       |     0.795  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.737  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - UAS                      |     0.935  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.306  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - loss                     |     0.823  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - LAS                      |     0.878  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:34:42,925 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:34:42,926 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:34:42,926 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:34:42,926 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:34:42,926 - INFO - combo.training.trainer - Epoch duration: 0:01:07.468682\n",
+      "2023-04-06 23:34:42,926 - INFO - combo.training.trainer - Estimated training time remaining: 6:46:00\n",
+      "2023-04-06 23:34:42,926 - INFO - allennlp.training.trainer - Epoch 40/399\n",
+      "2023-04-06 23:34:42,927 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:34:42,927 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:34:42,933 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9400, LAS: 0.8828, UEM: 0.4868, LEM: 0.2070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6732, partial_loss/deprel_loss: 0.7949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8973, loss: 0.8036, batch_reg_loss: 0.1268, reg_loss: 0.1267 ||:   4%|4         | 4/95 [00:02<00:51,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9421, LAS: 0.8870, UEM: 0.4658, LEM: 0.1947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6863, partial_loss/deprel_loss: 0.7191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8394, loss: 0.7717, batch_reg_loss: 0.1268, reg_loss: 0.1268 ||:   7%|7         | 7/95 [00:04<00:55,  1.59it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9476, LAS: 0.8928, UEM: 0.5637, LEM: 0.2815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.4735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5587, loss: 0.7269, batch_reg_loss: 0.1269, reg_loss: 0.1268 ||:  11%|#         | 10/95 [00:07<00:58,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9404, LAS: 0.8855, UEM: 0.5344, LEM: 0.2657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3865, partial_loss/deprel_loss: 0.5412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6372, loss: 0.7765, batch_reg_loss: 0.1269, reg_loss: 0.1268 ||:  14%|#3        | 13/95 [00:09<00:56,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9422, LAS: 0.8870, UEM: 0.5699, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1448, partial_loss/deprel_loss: 0.3290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4191, loss: 0.7601, batch_reg_loss: 0.1270, reg_loss: 0.1268 ||:  17%|#6        | 16/95 [00:11<00:57,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9428, LAS: 0.8874, UEM: 0.5908, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2763, partial_loss/deprel_loss: 0.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5658, loss: 0.7553, batch_reg_loss: 0.1270, reg_loss: 0.1269 ||:  20%|##        | 19/95 [00:13<00:54,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7986, UAS: 0.9376, LAS: 0.8821, UEM: 0.5716, LEM: 0.3090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7296, partial_loss/deprel_loss: 1.2162, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4460, loss: 0.8000, batch_reg_loss: 0.1271, reg_loss: 0.1269 ||:  24%|##4       | 23/95 [00:16<00:49,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9389, LAS: 0.8848, UEM: 0.6288, LEM: 0.3959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2579, partial_loss/deprel_loss: 0.3547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4625, loss: 0.7762, batch_reg_loss: 0.1272, reg_loss: 0.1269 ||:  27%|##7       | 26/95 [00:19<00:53,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9381, LAS: 0.8835, UEM: 0.6019, LEM: 0.3694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6894, partial_loss/deprel_loss: 0.6837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8121, loss: 0.7863, batch_reg_loss: 0.1273, reg_loss: 0.1270 ||:  32%|###1      | 30/95 [00:21<00:47,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9404, LAS: 0.8862, UEM: 0.6130, LEM: 0.3716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2661, partial_loss/deprel_loss: 0.4562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.7672, batch_reg_loss: 0.1273, reg_loss: 0.1270 ||:  35%|###4      | 33/95 [00:23<00:44,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9384, LAS: 0.8841, UEM: 0.5955, LEM: 0.3546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3805, partial_loss/deprel_loss: 0.5536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6464, loss: 0.7814, batch_reg_loss: 0.1274, reg_loss: 0.1270 ||:  39%|###8      | 37/95 [00:26<00:41,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8371, UAS: 0.9361, LAS: 0.8813, UEM: 0.5781, LEM: 0.3425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1116, partial_loss/deprel_loss: 0.9277, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0919, loss: 0.8044, batch_reg_loss: 0.1274, reg_loss: 0.1271 ||:  42%|####2     | 40/95 [00:28<00:40,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8429, UAS: 0.9349, LAS: 0.8800, UEM: 0.5685, LEM: 0.3341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0994, partial_loss/deprel_loss: 0.9195, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0830, loss: 0.8124, batch_reg_loss: 0.1275, reg_loss: 0.1271 ||:  45%|####5     | 43/95 [00:31<00:38,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9339, LAS: 0.8786, UEM: 0.5597, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7561, partial_loss/deprel_loss: 0.8972, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9965, loss: 0.8232, batch_reg_loss: 0.1275, reg_loss: 0.1271 ||:  48%|####8     | 46/95 [00:33<00:37,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9345, LAS: 0.8791, UEM: 0.5693, LEM: 0.3349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.3585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4392, loss: 0.8194, batch_reg_loss: 0.1276, reg_loss: 0.1272 ||:  52%|#####1    | 49/95 [00:35<00:35,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9347, LAS: 0.8792, UEM: 0.5634, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3834, partial_loss/deprel_loss: 0.5559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6491, loss: 0.8214, batch_reg_loss: 0.1277, reg_loss: 0.1272 ||:  55%|#####4    | 52/95 [00:38<00:32,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9352, LAS: 0.8798, UEM: 0.5676, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4259, partial_loss/deprel_loss: 1.1430, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3273, loss: 0.8205, batch_reg_loss: 0.1277, reg_loss: 0.1272 ||:  58%|#####7    | 55/95 [00:40<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9358, LAS: 0.8805, UEM: 0.5735, LEM: 0.3334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1972, partial_loss/deprel_loss: 0.4667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5406, loss: 0.8155, batch_reg_loss: 0.1278, reg_loss: 0.1272 ||:  61%|######1   | 58/95 [00:42<00:27,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9364, LAS: 0.8807, UEM: 0.5704, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6597, partial_loss/deprel_loss: 0.7953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8960, loss: 0.8129, batch_reg_loss: 0.1279, reg_loss: 0.1273 ||:  65%|######5   | 62/95 [00:44<00:22,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9368, LAS: 0.8811, UEM: 0.5682, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4632, partial_loss/deprel_loss: 0.6542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7439, loss: 0.8092, batch_reg_loss: 0.1279, reg_loss: 0.1273 ||:  68%|######8   | 65/95 [00:46<00:20,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7714, UAS: 0.9352, LAS: 0.8794, UEM: 0.5582, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2057, partial_loss/deprel_loss: 1.4002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6893, loss: 0.8228, batch_reg_loss: 0.1280, reg_loss: 0.1273 ||:  73%|#######2  | 69/95 [00:49<00:17,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9349, LAS: 0.8790, UEM: 0.5481, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9324, partial_loss/deprel_loss: 0.9164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0477, loss: 0.8266, batch_reg_loss: 0.1281, reg_loss: 0.1274 ||:  77%|#######6  | 73/95 [00:51<00:13,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9343, LAS: 0.8782, UEM: 0.5396, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4719, partial_loss/deprel_loss: 0.6551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7466, loss: 0.8310, batch_reg_loss: 0.1282, reg_loss: 0.1274 ||:  81%|########1 | 77/95 [00:54<00:11,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9355, LAS: 0.8795, UEM: 0.5530, LEM: 0.3079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4529, partial_loss/deprel_loss: 0.6099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7067, loss: 0.8195, batch_reg_loss: 0.1283, reg_loss: 0.1275 ||:  85%|########5 | 81/95 [00:56<00:09,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9354, LAS: 0.8793, UEM: 0.5509, LEM: 0.3043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4369, partial_loss/deprel_loss: 0.5590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6630, loss: 0.8217, batch_reg_loss: 0.1283, reg_loss: 0.1275 ||:  89%|########9 | 85/95 [00:59<00:06,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8636, UAS: 0.9360, LAS: 0.8801, UEM: 0.5586, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8639, partial_loss/deprel_loss: 0.7844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9288, loss: 0.8147, batch_reg_loss: 0.1284, reg_loss: 0.1275 ||:  94%|#########3| 89/95 [01:02<00:03,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8271, UAS: 0.9354, LAS: 0.8793, UEM: 0.5562, LEM: 0.3087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1743, partial_loss/deprel_loss: 0.9940, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1585, loss: 0.8192, batch_reg_loss: 0.1285, reg_loss: 0.1276 ||:  98%|#########7| 93/95 [01:04<00:01,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9352, LAS: 0.8793, UEM: 0.5649, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1439, partial_loss/deprel_loss: 0.2729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3757, loss: 0.8192, batch_reg_loss: 0.1285, reg_loss: 0.1276 ||: 100%|##########| 95/95 [01:06<00:00,  1.44it/s]\n",
+      "2023-04-06 23:35:48,999 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9453, LAS: 0.8944, UEM: 0.7057, LEM: 0.4387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2201, partial_loss/deprel_loss: 22.8404, partial_loss/cycle_loss: 0.0000, batch_loss: 18.3164, loss: 29.2944, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.03s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9470, LAS: 0.8957, UEM: 0.6582, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4912, partial_loss/deprel_loss: 24.5113, partial_loss/cycle_loss: 0.0000, batch_loss: 19.7073, loss: 24.2815, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:05,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9471, LAS: 0.8932, UEM: 0.6188, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2938, partial_loss/deprel_loss: 28.4128, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7890, loss: 26.0436, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:07<00:02,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9459, LAS: 0.8926, UEM: 0.6672, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2192, partial_loss/deprel_loss: 19.9219, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9814, loss: 26.8978, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9459, LAS: 0.8926, UEM: 0.6672, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2192, partial_loss/deprel_loss: 19.9219, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9814, loss: 26.8978, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.02it/s]\n",
+      "2023-04-06 23:35:59,794 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.128  |     0.000\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - UEM                      |     0.565  |     0.667\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - LEM                      |     0.321  |     0.398\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - EM                       |     0.936  |     0.937\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.144  |     0.219\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - UAS                      |     0.935  |     0.946\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.273  |    19.922\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - loss                     |     0.819  |    26.898\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - LAS                      |     0.879  |     0.893\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:35:59,795 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:35:59,796 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:35:59,796 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:35:59,796 - INFO - combo.training.trainer - Epoch duration: 0:01:16.869728\n",
+      "2023-04-06 23:35:59,796 - INFO - combo.training.trainer - Estimated training time remaining: 6:46:13\n",
+      "2023-04-06 23:35:59,796 - INFO - allennlp.training.trainer - Epoch 41/399\n",
+      "2023-04-06 23:35:59,796 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:35:59,797 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:35:59,803 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9360, LAS: 0.8791, UEM: 0.4178, LEM: 0.1620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7190, partial_loss/deprel_loss: 0.8510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9532, loss: 0.8111, batch_reg_loss: 0.1286, reg_loss: 0.1286 ||:   3%|3         | 3/95 [00:02<01:01,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8220, UAS: 0.9273, LAS: 0.8723, UEM: 0.3843, LEM: 0.1462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3957, partial_loss/deprel_loss: 1.0064, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2129, loss: 0.8524, batch_reg_loss: 0.1287, reg_loss: 0.1286 ||:   7%|7         | 7/95 [00:04<00:58,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8973, UAS: 0.9241, LAS: 0.8685, UEM: 0.3692, LEM: 0.1388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4538, partial_loss/deprel_loss: 0.5585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.8688, batch_reg_loss: 0.1287, reg_loss: 0.1286 ||:  12%|#1        | 11/95 [00:06<00:53,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9240, LAS: 0.8673, UEM: 0.3374, LEM: 0.1240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1968, partial_loss/deprel_loss: 0.8812, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0732, loss: 0.8840, batch_reg_loss: 0.1288, reg_loss: 0.1287 ||:  16%|#5        | 15/95 [00:09<00:50,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9250, LAS: 0.8676, UEM: 0.3484, LEM: 0.1303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7812, partial_loss/deprel_loss: 0.8881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9956, loss: 0.8889, batch_reg_loss: 0.1289, reg_loss: 0.1287 ||:  19%|#8        | 18/95 [00:11<00:50,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8025, UAS: 0.9218, LAS: 0.8643, UEM: 0.3429, LEM: 0.1296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8468, partial_loss/deprel_loss: 1.1586, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4252, loss: 0.9182, batch_reg_loss: 0.1289, reg_loss: 0.1287 ||:  22%|##2       | 21/95 [00:13<00:49,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9241, LAS: 0.8671, UEM: 0.3746, LEM: 0.1478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4220, partial_loss/deprel_loss: 0.5515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6546, loss: 0.8955, batch_reg_loss: 0.1290, reg_loss: 0.1288 ||:  25%|##5       | 24/95 [00:16<00:50,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9262, LAS: 0.8692, UEM: 0.3980, LEM: 0.1641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2627, partial_loss/deprel_loss: 0.4659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5544, loss: 0.8827, batch_reg_loss: 0.1291, reg_loss: 0.1288 ||:  28%|##8       | 27/95 [00:18<00:47,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8416, UAS: 0.9284, LAS: 0.8709, UEM: 0.4256, LEM: 0.1786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0322, partial_loss/deprel_loss: 0.9060, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0604, loss: 0.8674, batch_reg_loss: 0.1292, reg_loss: 0.1288 ||:  33%|###2      | 31/95 [00:20<00:42,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9290, LAS: 0.8714, UEM: 0.4254, LEM: 0.1775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8132, partial_loss/deprel_loss: 0.8807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9964, loss: 0.8620, batch_reg_loss: 0.1292, reg_loss: 0.1289 ||:  36%|###5      | 34/95 [00:22<00:42,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9295, LAS: 0.8721, UEM: 0.4283, LEM: 0.1798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5825, partial_loss/deprel_loss: 0.7448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8416, loss: 0.8553, batch_reg_loss: 0.1293, reg_loss: 0.1289 ||:  40%|####      | 38/95 [00:25<00:38,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8530, UAS: 0.9303, LAS: 0.8732, UEM: 0.4489, LEM: 0.2006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0398, partial_loss/deprel_loss: 0.9269, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0788, loss: 0.8499, batch_reg_loss: 0.1294, reg_loss: 0.1289 ||:  43%|####3     | 41/95 [00:27<00:36,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9306, LAS: 0.8737, UEM: 0.4761, LEM: 0.2369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1365, partial_loss/deprel_loss: 0.2568, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3622, loss: 0.8484, batch_reg_loss: 0.1294, reg_loss: 0.1290 ||:  46%|####6     | 44/95 [00:29<00:36,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9313, LAS: 0.8745, UEM: 0.4715, LEM: 0.2310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5074, partial_loss/deprel_loss: 0.6380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7414, loss: 0.8422, batch_reg_loss: 0.1295, reg_loss: 0.1290 ||:  51%|#####     | 48/95 [00:32<00:32,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9327, LAS: 0.8761, UEM: 0.4949, LEM: 0.2510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6366, partial_loss/deprel_loss: 0.7918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8903, loss: 0.8296, batch_reg_loss: 0.1295, reg_loss: 0.1290 ||:  54%|#####3    | 51/95 [00:34<00:31,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8209, UAS: 0.9322, LAS: 0.8756, UEM: 0.4983, LEM: 0.2559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3103, partial_loss/deprel_loss: 1.1247, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2914, loss: 0.8344, batch_reg_loss: 0.1296, reg_loss: 0.1291 ||:  58%|#####7    | 55/95 [00:36<00:27,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7698, UAS: 0.9314, LAS: 0.8749, UEM: 0.5076, LEM: 0.2664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0794, partial_loss/deprel_loss: 1.3318, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6110, loss: 0.8396, batch_reg_loss: 0.1297, reg_loss: 0.1291 ||:  61%|######1   | 58/95 [00:39<00:25,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9332, LAS: 0.8771, UEM: 0.5475, LEM: 0.3113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4219, partial_loss/deprel_loss: 0.5777, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6762, loss: 0.8229, batch_reg_loss: 0.1297, reg_loss: 0.1291 ||:  64%|######4   | 61/95 [00:41<00:25,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9341, LAS: 0.8781, UEM: 0.5496, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2618, partial_loss/deprel_loss: 0.4587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5491, loss: 0.8169, batch_reg_loss: 0.1298, reg_loss: 0.1292 ||:  67%|######7   | 64/95 [00:43<00:23,  1.34it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8843, UAS: 0.9342, LAS: 0.8783, UEM: 0.5438, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4889, partial_loss/deprel_loss: 0.6987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 0.8161, batch_reg_loss: 0.1298, reg_loss: 0.1292 ||:  71%|#######   | 67/95 [00:46<00:20,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8365, UAS: 0.9343, LAS: 0.8784, UEM: 0.5427, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1633, partial_loss/deprel_loss: 1.0104, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1708, loss: 0.8170, batch_reg_loss: 0.1299, reg_loss: 0.1292 ||:  74%|#######3  | 70/95 [00:48<00:18,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8491, UAS: 0.9327, LAS: 0.8766, UEM: 0.5300, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9013, partial_loss/deprel_loss: 0.9811, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0951, loss: 0.8309, batch_reg_loss: 0.1300, reg_loss: 0.1293 ||:  78%|#######7  | 74/95 [00:50<00:14,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9333, LAS: 0.8771, UEM: 0.5329, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2841, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5919, loss: 0.8263, batch_reg_loss: 0.1300, reg_loss: 0.1293 ||:  81%|########1 | 77/95 [00:53<00:13,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9342, LAS: 0.8780, UEM: 0.5402, LEM: 0.3009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1776, partial_loss/deprel_loss: 0.3950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4816, loss: 0.8205, batch_reg_loss: 0.1301, reg_loss: 0.1293 ||:  84%|########4 | 80/95 [00:55<00:10,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9349, LAS: 0.8785, UEM: 0.5445, LEM: 0.3024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3958, partial_loss/deprel_loss: 0.6372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7191, loss: 0.8184, batch_reg_loss: 0.1302, reg_loss: 0.1294 ||:  88%|########8 | 84/95 [00:57<00:07,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9345, LAS: 0.8780, UEM: 0.5462, LEM: 0.3023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3038, partial_loss/deprel_loss: 0.5278, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6132, loss: 0.8204, batch_reg_loss: 0.1302, reg_loss: 0.1294 ||:  92%|#########1| 87/95 [01:00<00:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9350, LAS: 0.8786, UEM: 0.5507, LEM: 0.3049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3045, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5868, loss: 0.8158, batch_reg_loss: 0.1303, reg_loss: 0.1294 ||:  95%|#########4| 90/95 [01:02<00:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9341, LAS: 0.8776, UEM: 0.5549, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1568, partial_loss/deprel_loss: 0.3802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4659, loss: 0.8229, batch_reg_loss: 0.1303, reg_loss: 0.1295 ||:  98%|#########7| 93/95 [01:04<00:01,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8902, UAS: 0.9344, LAS: 0.8780, UEM: 0.5592, LEM: 0.3146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4078, partial_loss/deprel_loss: 0.5990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6911, loss: 0.8183, batch_reg_loss: 0.1304, reg_loss: 0.1295 ||: 100%|##########| 95/95 [01:05<00:00,  1.44it/s]\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.129  |       N/A\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - UEM                      |     0.559  |       N/A\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - LEM                      |     0.315  |       N/A\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - EM                       |     0.890  |       N/A\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.408  |       N/A\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:37:05,772 - INFO - combo.training.tensorboard_writer - UAS                      |     0.934  |       N/A\n",
+      "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.599  |       N/A\n",
+      "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - loss                     |     0.818  |       N/A\n",
+      "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - LAS                      |     0.878  |       N/A\n",
+      "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:37:05,773 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:37:05,774 - INFO - combo.training.trainer - Epoch duration: 0:01:05.977443\n",
+      "2023-04-06 23:37:05,774 - INFO - combo.training.trainer - Estimated training time remaining: 6:44:49\n",
+      "2023-04-06 23:37:05,774 - INFO - allennlp.training.trainer - Epoch 42/399\n",
+      "2023-04-06 23:37:05,774 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:37:05,775 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:37:05,781 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9303, LAS: 0.8783, UEM: 0.6649, LEM: 0.4584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3038, partial_loss/deprel_loss: 0.4927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5854, loss: 0.8148, batch_reg_loss: 0.1304, reg_loss: 0.1304 ||:   4%|4         | 4/95 [00:02<00:52,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9310, LAS: 0.8747, UEM: 0.5858, LEM: 0.3371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5777, partial_loss/deprel_loss: 0.7217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8234, loss: 0.8341, batch_reg_loss: 0.1305, reg_loss: 0.1305 ||:   8%|8         | 8/95 [00:04<00:49,  1.76it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8432, UAS: 0.9321, LAS: 0.8765, UEM: 0.5879, LEM: 0.3550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9779, partial_loss/deprel_loss: 0.9717, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1036, loss: 0.8301, batch_reg_loss: 0.1306, reg_loss: 0.1305 ||:  13%|#2        | 12/95 [00:07<00:48,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9364, LAS: 0.8806, UEM: 0.6022, LEM: 0.3424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2397, partial_loss/deprel_loss: 0.4584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5453, loss: 0.7917, batch_reg_loss: 0.1307, reg_loss: 0.1305 ||:  17%|#6        | 16/95 [00:09<00:47,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9375, LAS: 0.8823, UEM: 0.5799, LEM: 0.3194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3787, partial_loss/deprel_loss: 0.5640, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6576, loss: 0.7849, batch_reg_loss: 0.1307, reg_loss: 0.1306 ||:  21%|##1       | 20/95 [00:11<00:43,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9379, LAS: 0.8825, UEM: 0.5854, LEM: 0.3265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1910, partial_loss/deprel_loss: 0.3831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4754, loss: 0.7820, batch_reg_loss: 0.1308, reg_loss: 0.1306 ||:  24%|##4       | 23/95 [00:13<00:43,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9385, LAS: 0.8835, UEM: 0.5862, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3787, partial_loss/deprel_loss: 0.5514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6477, loss: 0.7759, batch_reg_loss: 0.1308, reg_loss: 0.1306 ||:  27%|##7       | 26/95 [00:15<00:43,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9382, LAS: 0.8834, UEM: 0.5912, LEM: 0.3274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2382, partial_loss/deprel_loss: 0.4722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5563, loss: 0.7758, batch_reg_loss: 0.1309, reg_loss: 0.1306 ||:  31%|###       | 29/95 [00:18<00:44,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9363, LAS: 0.8811, UEM: 0.5848, LEM: 0.3215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4300, partial_loss/deprel_loss: 0.5942, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6923, loss: 0.7947, batch_reg_loss: 0.1310, reg_loss: 0.1307 ||:  34%|###3      | 32/95 [00:20<00:43,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8532, UAS: 0.9350, LAS: 0.8798, UEM: 0.5674, LEM: 0.3094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8510, partial_loss/deprel_loss: 0.8855, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0096, loss: 0.8071, batch_reg_loss: 0.1310, reg_loss: 0.1307 ||:  37%|###6      | 35/95 [00:22<00:41,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9367, LAS: 0.8819, UEM: 0.5845, LEM: 0.3315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3981, partial_loss/deprel_loss: 0.5429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6450, loss: 0.7921, batch_reg_loss: 0.1311, reg_loss: 0.1307 ||:  41%|####1     | 39/95 [00:24<00:37,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8363, UAS: 0.9352, LAS: 0.8802, UEM: 0.5727, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1738, partial_loss/deprel_loss: 0.9203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1022, loss: 0.8053, batch_reg_loss: 0.1312, reg_loss: 0.1308 ||:  45%|####5     | 43/95 [00:27<00:34,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9348, LAS: 0.8799, UEM: 0.5619, LEM: 0.3125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6058, partial_loss/deprel_loss: 0.7052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8165, loss: 0.8099, batch_reg_loss: 0.1312, reg_loss: 0.1308 ||:  48%|####8     | 46/95 [00:29<00:33,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9329, LAS: 0.8774, UEM: 0.5492, LEM: 0.3038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4213, partial_loss/deprel_loss: 0.5934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6902, loss: 0.8315, batch_reg_loss: 0.1313, reg_loss: 0.1308 ||:  53%|#####2    | 50/95 [00:32<00:30,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9343, LAS: 0.8790, UEM: 0.5635, LEM: 0.3117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2668, partial_loss/deprel_loss: 0.4025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5067, loss: 0.8181, batch_reg_loss: 0.1314, reg_loss: 0.1309 ||:  56%|#####5    | 53/95 [00:34<00:29,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9334, LAS: 0.8781, UEM: 0.5632, LEM: 0.3101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4459, partial_loss/deprel_loss: 0.5907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6931, loss: 0.8239, batch_reg_loss: 0.1314, reg_loss: 0.1309 ||:  59%|#####8    | 56/95 [00:36<00:27,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9340, LAS: 0.8785, UEM: 0.5642, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2055, partial_loss/deprel_loss: 0.3961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4895, loss: 0.8222, batch_reg_loss: 0.1315, reg_loss: 0.1309 ||:  62%|######2   | 59/95 [00:39<00:26,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9600, UAS: 0.9346, LAS: 0.8796, UEM: 0.5936, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0504, partial_loss/deprel_loss: 0.1567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2670, loss: 0.8129, batch_reg_loss: 0.1315, reg_loss: 0.1310 ||:  65%|######5   | 62/95 [00:41<00:25,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 0.9339, LAS: 0.8788, UEM: 0.5859, LEM: 0.3440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8858, partial_loss/deprel_loss: 0.8773, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0106, loss: 0.8194, batch_reg_loss: 0.1316, reg_loss: 0.1310 ||:  69%|######9   | 66/95 [00:44<00:20,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9333, LAS: 0.8780, UEM: 0.5756, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6500, partial_loss/deprel_loss: 0.7221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8394, loss: 0.8262, batch_reg_loss: 0.1317, reg_loss: 0.1310 ||:  74%|#######3  | 70/95 [00:46<00:17,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8645, UAS: 0.9338, LAS: 0.8782, UEM: 0.5723, LEM: 0.3298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8521, partial_loss/deprel_loss: 0.8831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0087, loss: 0.8255, batch_reg_loss: 0.1318, reg_loss: 0.1311 ||:  78%|#######7  | 74/95 [00:48<00:13,  1.52it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9341, LAS: 0.8784, UEM: 0.5675, LEM: 0.3241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3544, partial_loss/deprel_loss: 0.5790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6659, loss: 0.8236, batch_reg_loss: 0.1319, reg_loss: 0.1311 ||:  82%|########2 | 78/95 [00:51<00:11,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9351, LAS: 0.8792, UEM: 0.5704, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1957, partial_loss/deprel_loss: 0.4452, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5272, loss: 0.8173, batch_reg_loss: 0.1319, reg_loss: 0.1311 ||:  86%|########6 | 82/95 [00:54<00:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9355, LAS: 0.8796, UEM: 0.5687, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2853, partial_loss/deprel_loss: 0.4352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5372, loss: 0.8150, batch_reg_loss: 0.1320, reg_loss: 0.1312 ||:  91%|######### | 86/95 [00:57<00:06,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9360, LAS: 0.8801, UEM: 0.5755, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3179, partial_loss/deprel_loss: 0.4863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.8097, batch_reg_loss: 0.1321, reg_loss: 0.1312 ||:  95%|#########4| 90/95 [01:00<00:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8689, UAS: 0.9359, LAS: 0.8798, UEM: 0.5678, LEM: 0.3185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7598, partial_loss/deprel_loss: 0.8543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9676, loss: 0.8136, batch_reg_loss: 0.1321, reg_loss: 0.1313 ||:  99%|#########8| 94/95 [01:02<00:00,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8312, UAS: 0.9355, LAS: 0.8793, UEM: 0.5654, LEM: 0.3171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3172, partial_loss/deprel_loss: 1.0476, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2337, loss: 0.8180, batch_reg_loss: 0.1322, reg_loss: 0.1313 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.131  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - UEM                      |     0.565  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - LEM                      |     0.317  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - EM                       |     0.831  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.317  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - UAS                      |     0.935  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:38:09,335 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.048  |       N/A\n",
+      "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - loss                     |     0.818  |       N/A\n",
+      "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - LAS                      |     0.879  |       N/A\n",
+      "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:38:09,336 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:38:09,337 - INFO - combo.training.trainer - Epoch duration: 0:01:03.562509\n",
+      "2023-04-06 23:38:09,337 - INFO - combo.training.trainer - Estimated training time remaining: 6:43:05\n",
+      "2023-04-06 23:38:09,337 - INFO - allennlp.training.trainer - Epoch 43/399\n",
+      "2023-04-06 23:38:09,337 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:38:09,337 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:38:09,344 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9328, LAS: 0.8776, UEM: 0.5302, LEM: 0.3178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2034, partial_loss/deprel_loss: 0.3875, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4829, loss: 0.8172, batch_reg_loss: 0.1322, reg_loss: 0.1322 ||:   4%|4         | 4/95 [00:02<01:02,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9293, LAS: 0.8726, UEM: 0.5152, LEM: 0.3057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.4816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5698, loss: 0.8541, batch_reg_loss: 0.1323, reg_loss: 0.1322 ||:   7%|7         | 7/95 [00:05<01:03,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8938, UAS: 0.9360, LAS: 0.8807, UEM: 0.5238, LEM: 0.2915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4714, partial_loss/deprel_loss: 0.5702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6828, loss: 0.8027, batch_reg_loss: 0.1324, reg_loss: 0.1323 ||:  12%|#1        | 11/95 [00:07<00:58,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9424, LAS: 0.8876, UEM: 0.5878, LEM: 0.3337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2110, partial_loss/deprel_loss: 0.4511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5355, loss: 0.7549, batch_reg_loss: 0.1325, reg_loss: 0.1323 ||:  16%|#5        | 15/95 [00:10<00:53,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9433, LAS: 0.8887, UEM: 0.5881, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4317, partial_loss/deprel_loss: 0.5252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.7440, batch_reg_loss: 0.1325, reg_loss: 0.1324 ||:  19%|#8        | 18/95 [00:12<00:56,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9172, UAS: 0.9392, LAS: 0.8839, UEM: 0.5833, LEM: 0.3211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2968, partial_loss/deprel_loss: 0.4036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.7767, batch_reg_loss: 0.1326, reg_loss: 0.1324 ||:  23%|##3       | 22/95 [00:15<00:51,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9424, LAS: 0.8877, UEM: 0.6161, LEM: 0.3575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3311, partial_loss/deprel_loss: 0.5547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6426, loss: 0.7507, batch_reg_loss: 0.1327, reg_loss: 0.1324 ||:  27%|##7       | 26/95 [00:18<00:47,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9437, LAS: 0.8891, UEM: 0.6301, LEM: 0.3657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3410, partial_loss/deprel_loss: 0.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5761, loss: 0.7341, batch_reg_loss: 0.1327, reg_loss: 0.1325 ||:  31%|###       | 29/95 [00:20<00:46,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9429, LAS: 0.8883, UEM: 0.6261, LEM: 0.3618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7372, partial_loss/deprel_loss: 0.7821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9059, loss: 0.7425, batch_reg_loss: 0.1328, reg_loss: 0.1325 ||:  35%|###4      | 33/95 [00:22<00:42,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8224, UAS: 0.9407, LAS: 0.8858, UEM: 0.6095, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5700, partial_loss/deprel_loss: 1.0050, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2509, loss: 0.7631, batch_reg_loss: 0.1328, reg_loss: 0.1325 ||:  39%|###8      | 37/95 [00:25<00:38,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9395, LAS: 0.8842, UEM: 0.5960, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5814, partial_loss/deprel_loss: 0.7784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8719, loss: 0.7767, batch_reg_loss: 0.1329, reg_loss: 0.1326 ||:  42%|####2     | 40/95 [00:27<00:36,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8710, UAS: 0.9399, LAS: 0.8844, UEM: 0.5876, LEM: 0.3251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6151, partial_loss/deprel_loss: 0.7105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8243, loss: 0.7740, batch_reg_loss: 0.1329, reg_loss: 0.1326 ||:  45%|####5     | 43/95 [00:29<00:35,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9370, LAS: 0.8810, UEM: 0.5682, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5969, partial_loss/deprel_loss: 0.7569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8579, loss: 0.7990, batch_reg_loss: 0.1330, reg_loss: 0.1326 ||:  49%|####9     | 47/95 [00:31<00:32,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9387, LAS: 0.8830, UEM: 0.5834, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2709, partial_loss/deprel_loss: 0.4182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5218, loss: 0.7847, batch_reg_loss: 0.1331, reg_loss: 0.1326 ||:  53%|#####2    | 50/95 [00:34<00:31,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.9390, LAS: 0.8832, UEM: 0.5795, LEM: 0.3175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6686, partial_loss/deprel_loss: 0.7567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8722, loss: 0.7829, batch_reg_loss: 0.1331, reg_loss: 0.1327 ||:  56%|#####5    | 53/95 [00:36<00:29,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9390, LAS: 0.8832, UEM: 0.5714, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4463, partial_loss/deprel_loss: 0.5824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6884, loss: 0.7834, batch_reg_loss: 0.1332, reg_loss: 0.1327 ||:  59%|#####8    | 56/95 [00:38<00:27,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9398, LAS: 0.8838, UEM: 0.5810, LEM: 0.3198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3849, partial_loss/deprel_loss: 0.5608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6588, loss: 0.7789, batch_reg_loss: 0.1333, reg_loss: 0.1327 ||:  62%|######2   | 59/95 [00:40<00:26,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9388, LAS: 0.8827, UEM: 0.5779, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1482, partial_loss/deprel_loss: 0.4166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4963, loss: 0.7892, batch_reg_loss: 0.1333, reg_loss: 0.1328 ||:  66%|######6   | 63/95 [00:43<00:22,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9391, LAS: 0.8832, UEM: 0.5753, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4211, partial_loss/deprel_loss: 0.5615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6668, loss: 0.7859, batch_reg_loss: 0.1334, reg_loss: 0.1328 ||:  69%|######9   | 66/95 [00:45<00:20,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9396, LAS: 0.8837, UEM: 0.5836, LEM: 0.3240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1483, partial_loss/deprel_loss: 0.3676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4572, loss: 0.7803, batch_reg_loss: 0.1335, reg_loss: 0.1328 ||:  74%|#######3  | 70/95 [00:48<00:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7856, UAS: 0.9378, LAS: 0.8816, UEM: 0.5722, LEM: 0.3161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9450, partial_loss/deprel_loss: 1.2410, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5154, loss: 0.7974, batch_reg_loss: 0.1335, reg_loss: 0.1329 ||:  78%|#######7  | 74/95 [00:51<00:14,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8512, UAS: 0.9365, LAS: 0.8803, UEM: 0.5662, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9895, partial_loss/deprel_loss: 0.9200, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0675, loss: 0.8079, batch_reg_loss: 0.1336, reg_loss: 0.1329 ||:  82%|########2 | 78/95 [00:53<00:11,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9533, UAS: 0.9369, LAS: 0.8808, UEM: 0.5785, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0708, partial_loss/deprel_loss: 0.1772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2896, loss: 0.8039, batch_reg_loss: 0.1337, reg_loss: 0.1329 ||:  86%|########6 | 82/95 [00:56<00:09,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9366, LAS: 0.8805, UEM: 0.5736, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1568, partial_loss/deprel_loss: 1.0099, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1730, loss: 0.8072, batch_reg_loss: 0.1338, reg_loss: 0.1330 ||:  89%|########9 | 85/95 [00:58<00:06,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9356, LAS: 0.8793, UEM: 0.5682, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4791, partial_loss/deprel_loss: 1.0106, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2382, loss: 0.8170, batch_reg_loss: 0.1338, reg_loss: 0.1330 ||:  94%|#########3| 89/95 [01:01<00:04,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9363, LAS: 0.8801, UEM: 0.5704, LEM: 0.3241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6599, partial_loss/deprel_loss: 0.7541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8692, loss: 0.8104, batch_reg_loss: 0.1339, reg_loss: 0.1330 ||:  98%|#########7| 93/95 [01:03<00:01,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8364, UAS: 0.9361, LAS: 0.8797, UEM: 0.5673, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0906, partial_loss/deprel_loss: 0.9511, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1129, loss: 0.8123, batch_reg_loss: 0.1340, reg_loss: 0.1331 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n",
+      "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.133  |       N/A\n",
+      "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - UEM                      |     0.567  |       N/A\n",
+      "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - LEM                      |     0.321  |       N/A\n",
+      "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - EM                       |     0.836  |       N/A\n",
+      "2023-04-06 23:39:14,539 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.091  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - UAS                      |     0.936  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.951  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - loss                     |     0.812  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - LAS                      |     0.880  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:39:14,540 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:39:14,541 - INFO - combo.training.trainer - Epoch duration: 0:01:05.204106\n",
+      "2023-04-06 23:39:14,541 - INFO - combo.training.trainer - Estimated training time remaining: 6:41:37\n",
+      "2023-04-06 23:39:14,541 - INFO - allennlp.training.trainer - Epoch 44/399\n",
+      "2023-04-06 23:39:14,541 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:39:14,542 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:39:14,548 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9467, LAS: 0.8917, UEM: 0.4808, LEM: 0.1828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4529, partial_loss/deprel_loss: 0.6344, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7321, loss: 0.7410, batch_reg_loss: 0.1340, reg_loss: 0.1340 ||:   3%|3         | 3/95 [00:02<01:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9530, LAS: 0.8992, UEM: 0.5987, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1523, partial_loss/deprel_loss: 0.3490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4438, loss: 0.6830, batch_reg_loss: 0.1341, reg_loss: 0.1340 ||:   6%|6         | 6/95 [00:04<01:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9495, LAS: 0.8961, UEM: 0.5836, LEM: 0.3069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5068, partial_loss/deprel_loss: 0.6826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7815, loss: 0.7073, batch_reg_loss: 0.1341, reg_loss: 0.1340 ||:   9%|9         | 9/95 [00:06<01:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9483, LAS: 0.8941, UEM: 0.5763, LEM: 0.2967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2854, partial_loss/deprel_loss: 0.5206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6077, loss: 0.7241, batch_reg_loss: 0.1342, reg_loss: 0.1341 ||:  14%|#3        | 13/95 [00:08<00:56,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9498, LAS: 0.8967, UEM: 0.5941, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.4274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5197, loss: 0.7078, batch_reg_loss: 0.1342, reg_loss: 0.1341 ||:  17%|#6        | 16/95 [00:10<00:53,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9483, LAS: 0.8945, UEM: 0.5725, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6361, partial_loss/deprel_loss: 0.6631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7920, loss: 0.7192, batch_reg_loss: 0.1343, reg_loss: 0.1341 ||:  21%|##1       | 20/95 [00:13<00:48,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9460, LAS: 0.8921, UEM: 0.5715, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4193, partial_loss/deprel_loss: 0.6510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7390, loss: 0.7372, batch_reg_loss: 0.1344, reg_loss: 0.1342 ||:  24%|##4       | 23/95 [00:15<00:47,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9434, LAS: 0.8882, UEM: 0.5545, LEM: 0.2806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2756, partial_loss/deprel_loss: 0.4521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5512, loss: 0.7633, batch_reg_loss: 0.1344, reg_loss: 0.1342 ||:  28%|##8       | 27/95 [00:17<00:43,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9439, LAS: 0.8889, UEM: 0.5700, LEM: 0.3025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4635, partial_loss/deprel_loss: 0.5984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7059, loss: 0.7591, batch_reg_loss: 0.1345, reg_loss: 0.1342 ||:  33%|###2      | 31/95 [00:20<00:41,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9427, LAS: 0.8874, UEM: 0.5599, LEM: 0.2962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2640, partial_loss/deprel_loss: 0.4821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5730, loss: 0.7653, batch_reg_loss: 0.1346, reg_loss: 0.1343 ||:  37%|###6      | 35/95 [00:23<00:40,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9389, LAS: 0.8834, UEM: 0.5573, LEM: 0.2981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1891, partial_loss/deprel_loss: 0.4254, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5128, loss: 0.7916, batch_reg_loss: 0.1347, reg_loss: 0.1343 ||:  41%|####1     | 39/95 [00:25<00:36,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8373, UAS: 0.9398, LAS: 0.8849, UEM: 0.5937, LEM: 0.3496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1354, partial_loss/deprel_loss: 0.9741, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1411, loss: 0.7816, batch_reg_loss: 0.1347, reg_loss: 0.1343 ||:  44%|####4     | 42/95 [00:28<00:37,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9413, LAS: 0.8865, UEM: 0.6106, LEM: 0.3641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1261, partial_loss/deprel_loss: 0.3357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4286, loss: 0.7688, batch_reg_loss: 0.1348, reg_loss: 0.1344 ||:  47%|####7     | 45/95 [00:30<00:36,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8616, UAS: 0.9401, LAS: 0.8851, UEM: 0.6033, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7775, partial_loss/deprel_loss: 0.7674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9043, loss: 0.7779, batch_reg_loss: 0.1348, reg_loss: 0.1344 ||:  51%|#####     | 48/95 [00:32<00:34,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9393, LAS: 0.8844, UEM: 0.5934, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0858, partial_loss/deprel_loss: 0.9209, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0888, loss: 0.7858, batch_reg_loss: 0.1349, reg_loss: 0.1344 ||:  54%|#####3    | 51/95 [00:34<00:32,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9394, LAS: 0.8846, UEM: 0.5909, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2761, partial_loss/deprel_loss: 0.4039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5133, loss: 0.7819, batch_reg_loss: 0.1350, reg_loss: 0.1345 ||:  57%|#####6    | 54/95 [00:37<00:30,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9394, LAS: 0.8846, UEM: 0.5911, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4536, partial_loss/deprel_loss: 1.1444, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3413, loss: 0.7833, batch_reg_loss: 0.1350, reg_loss: 0.1345 ||:  61%|######1   | 58/95 [00:39<00:25,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9399, LAS: 0.8851, UEM: 0.6075, LEM: 0.3635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2542, partial_loss/deprel_loss: 0.4055, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5103, loss: 0.7784, batch_reg_loss: 0.1351, reg_loss: 0.1345 ||:  64%|######4   | 61/95 [00:41<00:24,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8378, UAS: 0.9386, LAS: 0.8836, UEM: 0.6004, LEM: 0.3571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0466, partial_loss/deprel_loss: 0.9946, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1402, loss: 0.7893, batch_reg_loss: 0.1351, reg_loss: 0.1346 ||:  67%|######7   | 64/95 [00:44<00:22,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8638, UAS: 0.9380, LAS: 0.8827, UEM: 0.5919, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7341, partial_loss/deprel_loss: 0.8138, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9330, loss: 0.7970, batch_reg_loss: 0.1352, reg_loss: 0.1346 ||:  71%|#######   | 67/95 [00:46<00:20,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8284, UAS: 0.9381, LAS: 0.8826, UEM: 0.5893, LEM: 0.3439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1434, partial_loss/deprel_loss: 1.0298, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1878, loss: 0.7969, batch_reg_loss: 0.1353, reg_loss: 0.1346 ||:  75%|#######4  | 71/95 [00:48<00:16,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9379, LAS: 0.8824, UEM: 0.5830, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8588, partial_loss/deprel_loss: 0.8827, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0132, loss: 0.7989, batch_reg_loss: 0.1353, reg_loss: 0.1346 ||:  78%|#######7  | 74/95 [00:50<00:14,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8550, UAS: 0.9370, LAS: 0.8813, UEM: 0.5752, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8835, partial_loss/deprel_loss: 0.8707, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0087, loss: 0.8073, batch_reg_loss: 0.1354, reg_loss: 0.1347 ||:  81%|########1 | 77/95 [00:53<00:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8675, UAS: 0.9360, LAS: 0.8800, UEM: 0.5718, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7483, partial_loss/deprel_loss: 0.8180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9395, loss: 0.8174, batch_reg_loss: 0.1354, reg_loss: 0.1347 ||:  84%|########4 | 80/95 [00:55<00:10,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9362, LAS: 0.8801, UEM: 0.5681, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4420, partial_loss/deprel_loss: 0.5820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6895, loss: 0.8163, batch_reg_loss: 0.1355, reg_loss: 0.1347 ||:  87%|########7 | 83/95 [00:57<00:08,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9367, LAS: 0.8806, UEM: 0.5683, LEM: 0.3223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6559, partial_loss/deprel_loss: 0.7691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8820, loss: 0.8131, batch_reg_loss: 0.1356, reg_loss: 0.1348 ||:  91%|######### | 86/95 [00:59<00:06,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9232, UAS: 0.9372, LAS: 0.8813, UEM: 0.5741, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2528, partial_loss/deprel_loss: 0.3779, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.8076, batch_reg_loss: 0.1356, reg_loss: 0.1348 ||:  94%|#########3| 89/95 [01:02<00:04,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9369, LAS: 0.8811, UEM: 0.5679, LEM: 0.3218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4904, partial_loss/deprel_loss: 0.6834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7805, loss: 0.8105, batch_reg_loss: 0.1357, reg_loss: 0.1348 ||:  98%|#########7| 93/95 [01:04<00:01,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9364, LAS: 0.8805, UEM: 0.5661, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4135, partial_loss/deprel_loss: 0.5995, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6980, loss: 0.8161, batch_reg_loss: 0.1357, reg_loss: 0.1348 ||: 100%|##########| 95/95 [01:06<00:00,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-06 23:40:20,623 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:40:20,623 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:40:20,623 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.135  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - UEM                      |     0.566  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - LEM                      |     0.320  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - EM                       |     0.896  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.413  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - UAS                      |     0.936  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.599  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - loss                     |     0.816  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - LAS                      |     0.880  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:40:20,624 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:40:20,625 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:40:20,625 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:40:20,625 - INFO - combo.training.trainer - Epoch duration: 0:01:06.084070\n",
+      "2023-04-06 23:40:20,625 - INFO - combo.training.trainer - Estimated training time remaining: 6:40:17\n",
+      "2023-04-06 23:40:20,625 - INFO - allennlp.training.trainer - Epoch 45/399\n",
+      "2023-04-06 23:40:20,626 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:40:20,626 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:40:20,633 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9494, LAS: 0.8960, UEM: 0.6741, LEM: 0.4170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2605, partial_loss/deprel_loss: 0.4747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5676, loss: 0.6745, batch_reg_loss: 0.1358, reg_loss: 0.1358 ||:   3%|3         | 3/95 [00:02<01:03,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9461, LAS: 0.8939, UEM: 0.6654, LEM: 0.4282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8130, partial_loss/deprel_loss: 0.8523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9803, loss: 0.7075, batch_reg_loss: 0.1359, reg_loss: 0.1358 ||:   6%|6         | 6/95 [00:04<01:05,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9465, LAS: 0.8949, UEM: 0.6410, LEM: 0.3850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3733, partial_loss/deprel_loss: 0.5640, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.7026, batch_reg_loss: 0.1359, reg_loss: 0.1358 ||:   9%|9         | 9/95 [00:07<01:05,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9419, LAS: 0.8882, UEM: 0.5945, LEM: 0.3371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4328, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6636, loss: 0.7535, batch_reg_loss: 0.1360, reg_loss: 0.1359 ||:  14%|#3        | 13/95 [00:09<00:59,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9455, LAS: 0.8920, UEM: 0.6111, LEM: 0.3359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3072, partial_loss/deprel_loss: 0.4947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.7311, batch_reg_loss: 0.1361, reg_loss: 0.1359 ||:  18%|#7        | 17/95 [00:12<00:54,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9452, LAS: 0.8924, UEM: 0.6389, LEM: 0.4000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0746, partial_loss/deprel_loss: 0.2032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3136, loss: 0.7316, batch_reg_loss: 0.1361, reg_loss: 0.1360 ||:  22%|##2       | 21/95 [00:15<00:54,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9440, LAS: 0.8908, UEM: 0.6519, LEM: 0.4185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1294, partial_loss/deprel_loss: 0.2705, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3784, loss: 0.7436, batch_reg_loss: 0.1362, reg_loss: 0.1360 ||:  25%|##5       | 24/95 [00:17<00:50,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9409, LAS: 0.8871, UEM: 0.6308, LEM: 0.4006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2569, partial_loss/deprel_loss: 0.4021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5093, loss: 0.7703, batch_reg_loss: 0.1363, reg_loss: 0.1360 ||:  29%|##9       | 28/95 [00:19<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8388, UAS: 0.9407, LAS: 0.8870, UEM: 0.6304, LEM: 0.3968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3034, partial_loss/deprel_loss: 1.0082, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2036, loss: 0.7726, batch_reg_loss: 0.1363, reg_loss: 0.1360 ||:  33%|###2      | 31/95 [00:22<00:45,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8495, UAS: 0.9405, LAS: 0.8862, UEM: 0.6244, LEM: 0.3874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0059, partial_loss/deprel_loss: 0.9191, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0729, loss: 0.7778, batch_reg_loss: 0.1364, reg_loss: 0.1361 ||:  37%|###6      | 35/95 [00:24<00:41,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9416, LAS: 0.8876, UEM: 0.6220, LEM: 0.3787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2988, partial_loss/deprel_loss: 0.4795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5798, loss: 0.7673, batch_reg_loss: 0.1365, reg_loss: 0.1361 ||:  41%|####1     | 39/95 [00:27<00:39,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9422, LAS: 0.8883, UEM: 0.6175, LEM: 0.3732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2808, partial_loss/deprel_loss: 0.4012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5136, loss: 0.7585, batch_reg_loss: 0.1365, reg_loss: 0.1361 ||:  45%|####5     | 43/95 [00:30<00:36,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9432, LAS: 0.8891, UEM: 0.6218, LEM: 0.3729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2481, partial_loss/deprel_loss: 0.5173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6001, loss: 0.7497, batch_reg_loss: 0.1366, reg_loss: 0.1362 ||:  48%|####8     | 46/95 [00:32<00:34,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8423, UAS: 0.9402, LAS: 0.8859, UEM: 0.6066, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1341, partial_loss/deprel_loss: 0.9265, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1047, loss: 0.7741, batch_reg_loss: 0.1366, reg_loss: 0.1362 ||:  53%|#####2    | 50/95 [00:35<00:31,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8441, UAS: 0.9400, LAS: 0.8856, UEM: 0.6022, LEM: 0.3566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1163, partial_loss/deprel_loss: 0.9497, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1197, loss: 0.7758, batch_reg_loss: 0.1367, reg_loss: 0.1362 ||:  56%|#####5    | 53/95 [00:37<00:29,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8871, UAS: 0.9403, LAS: 0.8859, UEM: 0.5938, LEM: 0.3477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4960, partial_loss/deprel_loss: 0.5982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7146, loss: 0.7762, batch_reg_loss: 0.1368, reg_loss: 0.1363 ||:  60%|######    | 57/95 [00:39<00:25,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9383, LAS: 0.8835, UEM: 0.5834, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4552, partial_loss/deprel_loss: 0.6142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7192, loss: 0.7948, batch_reg_loss: 0.1368, reg_loss: 0.1363 ||:  64%|######4   | 61/95 [00:42<00:22,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9387, LAS: 0.8840, UEM: 0.5977, LEM: 0.3522, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1554, partial_loss/deprel_loss: 0.3544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4515, loss: 0.7900, batch_reg_loss: 0.1369, reg_loss: 0.1363 ||:  68%|######8   | 65/95 [00:45<00:20,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9384, LAS: 0.8836, UEM: 0.5927, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2767, partial_loss/deprel_loss: 0.4502, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5525, loss: 0.7931, batch_reg_loss: 0.1370, reg_loss: 0.1364 ||:  73%|#######2  | 69/95 [00:47<00:17,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9378, LAS: 0.8831, UEM: 0.5895, LEM: 0.3445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2753, partial_loss/deprel_loss: 0.5303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6163, loss: 0.7963, batch_reg_loss: 0.1371, reg_loss: 0.1364 ||:  76%|#######5  | 72/95 [00:50<00:16,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9361, LAS: 0.8812, UEM: 0.5811, LEM: 0.3384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6207, partial_loss/deprel_loss: 0.7086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8281, loss: 0.8108, batch_reg_loss: 0.1371, reg_loss: 0.1364 ||:  79%|#######8  | 75/95 [00:52<00:13,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9360, LAS: 0.8810, UEM: 0.5781, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1930, partial_loss/deprel_loss: 0.3984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4945, loss: 0.8120, batch_reg_loss: 0.1372, reg_loss: 0.1365 ||:  83%|########3 | 79/95 [00:54<00:10,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9366, LAS: 0.8815, UEM: 0.5757, LEM: 0.3305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4516, partial_loss/deprel_loss: 0.6488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7467, loss: 0.8091, batch_reg_loss: 0.1373, reg_loss: 0.1365 ||:  87%|########7 | 83/95 [00:57<00:08,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8508, UAS: 0.9357, LAS: 0.8802, UEM: 0.5671, LEM: 0.3249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8374, partial_loss/deprel_loss: 0.8827, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0110, loss: 0.8188, batch_reg_loss: 0.1374, reg_loss: 0.1365 ||:  91%|######### | 86/95 [01:00<00:06,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9362, LAS: 0.8807, UEM: 0.5675, LEM: 0.3223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3415, partial_loss/deprel_loss: 0.5740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6649, loss: 0.8156, batch_reg_loss: 0.1374, reg_loss: 0.1366 ||:  94%|#########3| 89/95 [01:02<00:04,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9362, LAS: 0.8807, UEM: 0.5685, LEM: 0.3253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9220, partial_loss/deprel_loss: 0.8461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9988, loss: 0.8153, batch_reg_loss: 0.1375, reg_loss: 0.1366 ||:  97%|#########6| 92/95 [01:04<00:02,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9362, LAS: 0.8807, UEM: 0.5664, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4165, partial_loss/deprel_loss: 0.5739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6799, loss: 0.8159, batch_reg_loss: 0.1375, reg_loss: 0.1366 ||: 100%|##########| 95/95 [01:06<00:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9362, LAS: 0.8807, UEM: 0.5664, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4165, partial_loss/deprel_loss: 0.5739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6799, loss: 0.8159, batch_reg_loss: 0.1375, reg_loss: 0.1366 ||: 100%|##########| 95/95 [01:06<00:00,  1.42it/s]\n",
+      "2023-04-06 23:41:27,404 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8713, UAS: 0.9165, LAS: 0.8550, UEM: 0.1988, LEM: 0.0361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8586, partial_loss/deprel_loss: 44.4118, partial_loss/cycle_loss: 0.0000, batch_loss: 35.7012, loss: 41.2754, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.06s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9456, LAS: 0.8943, UEM: 0.7281, LEM: 0.4981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2232, partial_loss/deprel_loss: 22.5852, partial_loss/cycle_loss: 0.0000, batch_loss: 18.1128, loss: 27.1635, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:05<00:06,  1.06s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9451, LAS: 0.8918, UEM: 0.6742, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8574, partial_loss/deprel_loss: 33.8063, partial_loss/cycle_loss: 0.0000, batch_loss: 27.2165, loss: 28.1215, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:08<00:03,  1.01s/it]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9469, LAS: 0.8927, UEM: 0.6672, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3619, partial_loss/deprel_loss: 24.0948, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3482, loss: 26.4357, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9469, LAS: 0.8927, UEM: 0.6672, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3619, partial_loss/deprel_loss: 24.0948, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3482, loss: 26.4357, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.05it/s]\n",
+      "2023-04-06 23:41:37,888 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.137  |     0.000\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - UEM                      |     0.566  |     0.667\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - LEM                      |     0.322  |     0.398\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - EM                       |     0.906  |     0.915\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.416  |     0.362\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - UAS                      |     0.936  |     0.947\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.574  |    24.095\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - loss                     |     0.816  |    26.436\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:41:37,889 - INFO - combo.training.tensorboard_writer - LAS                      |     0.881  |     0.893\n",
+      "2023-04-06 23:41:37,890 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:41:37,890 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:41:37,890 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:41:37,890 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:41:37,890 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:41:37,890 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:41:37,891 - INFO - combo.training.trainer - Epoch duration: 0:01:17.265210\n",
+      "2023-04-06 23:41:37,891 - INFO - combo.training.trainer - Estimated training time remaining: 6:40:23\n",
+      "2023-04-06 23:41:37,891 - INFO - allennlp.training.trainer - Epoch 46/399\n",
+      "2023-04-06 23:41:37,891 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:41:37,891 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:41:37,898 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8570, UAS: 0.9384, LAS: 0.8818, UEM: 0.3734, LEM: 0.1384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8249, partial_loss/deprel_loss: 0.9382, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0532, loss: 0.8264, batch_reg_loss: 0.1376, reg_loss: 0.1376 ||:   3%|3         | 3/95 [00:02<01:03,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9417, LAS: 0.8873, UEM: 0.4747, LEM: 0.2218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6840, partial_loss/deprel_loss: 0.7449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8704, loss: 0.7841, batch_reg_loss: 0.1377, reg_loss: 0.1376 ||:   6%|6         | 6/95 [00:04<01:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9425, LAS: 0.8875, UEM: 0.4812, LEM: 0.2071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3713, partial_loss/deprel_loss: 0.5899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6839, loss: 0.7722, batch_reg_loss: 0.1377, reg_loss: 0.1376 ||:  11%|#         | 10/95 [00:06<00:58,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8354, UAS: 0.9372, LAS: 0.8831, UEM: 0.4905, LEM: 0.2360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3465, partial_loss/deprel_loss: 0.9104, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1354, loss: 0.7935, batch_reg_loss: 0.1378, reg_loss: 0.1377 ||:  15%|#4        | 14/95 [00:09<00:53,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8498, UAS: 0.9297, LAS: 0.8741, UEM: 0.4456, LEM: 0.2105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1434, partial_loss/deprel_loss: 0.9181, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1010, loss: 0.8644, batch_reg_loss: 0.1379, reg_loss: 0.1377 ||:  19%|#8        | 18/95 [00:11<00:49,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8276, UAS: 0.9280, LAS: 0.8725, UEM: 0.4833, LEM: 0.2600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3145, partial_loss/deprel_loss: 1.0498, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2407, loss: 0.8758, batch_reg_loss: 0.1379, reg_loss: 0.1377 ||:  22%|##2       | 21/95 [00:13<00:48,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9286, LAS: 0.8732, UEM: 0.4933, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2313, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5604, loss: 0.8730, batch_reg_loss: 0.1380, reg_loss: 0.1378 ||:  25%|##5       | 24/95 [00:17<01:01,  1.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8390, UAS: 0.9300, LAS: 0.8744, UEM: 0.4931, LEM: 0.2588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1832, partial_loss/deprel_loss: 0.9521, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1364, loss: 0.8631, batch_reg_loss: 0.1381, reg_loss: 0.1378 ||:  29%|##9       | 28/95 [00:20<00:53,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9325, LAS: 0.8773, UEM: 0.5136, LEM: 0.2703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3778, partial_loss/deprel_loss: 0.5454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6501, loss: 0.8409, batch_reg_loss: 0.1382, reg_loss: 0.1379 ||:  34%|###3      | 32/95 [00:22<00:47,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9315, LAS: 0.8762, UEM: 0.5065, LEM: 0.2656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0980, partial_loss/deprel_loss: 0.9244, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0973, loss: 0.8481, batch_reg_loss: 0.1382, reg_loss: 0.1379 ||:  37%|###6      | 35/95 [00:25<00:43,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8415, UAS: 0.9277, LAS: 0.8720, UEM: 0.4886, LEM: 0.2554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9752, partial_loss/deprel_loss: 0.8297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9971, loss: 0.8780, batch_reg_loss: 0.1383, reg_loss: 0.1379 ||:  40%|####      | 38/95 [00:27<00:41,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9306, LAS: 0.8754, UEM: 0.5315, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1455, partial_loss/deprel_loss: 0.3835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4742, loss: 0.8522, batch_reg_loss: 0.1384, reg_loss: 0.1379 ||:  43%|####3     | 41/95 [00:29<00:40,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9326, LAS: 0.8776, UEM: 0.5548, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2717, partial_loss/deprel_loss: 0.5146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6045, loss: 0.8329, batch_reg_loss: 0.1384, reg_loss: 0.1380 ||:  46%|####6     | 44/95 [00:32<00:39,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9335, LAS: 0.8787, UEM: 0.5579, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2463, partial_loss/deprel_loss: 0.4783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5704, loss: 0.8267, batch_reg_loss: 0.1385, reg_loss: 0.1380 ||:  49%|####9     | 47/95 [00:34<00:37,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9340, LAS: 0.8793, UEM: 0.5501, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4458, partial_loss/deprel_loss: 0.5934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7024, loss: 0.8208, batch_reg_loss: 0.1385, reg_loss: 0.1380 ||:  53%|#####2    | 50/95 [00:36<00:34,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9337, LAS: 0.8787, UEM: 0.5367, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9964, partial_loss/deprel_loss: 0.8618, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0273, loss: 0.8244, batch_reg_loss: 0.1386, reg_loss: 0.1381 ||:  57%|#####6    | 54/95 [00:39<00:29,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9349, LAS: 0.8801, UEM: 0.5640, LEM: 0.3265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0686, partial_loss/deprel_loss: 0.1964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3095, loss: 0.8150, batch_reg_loss: 0.1387, reg_loss: 0.1381 ||:  60%|######    | 57/95 [00:41<00:28,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9348, LAS: 0.8798, UEM: 0.5555, LEM: 0.3179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9198, partial_loss/deprel_loss: 0.8242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9821, loss: 0.8174, batch_reg_loss: 0.1387, reg_loss: 0.1381 ||:  64%|######4   | 61/95 [00:44<00:24,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9352, LAS: 0.8805, UEM: 0.5606, LEM: 0.3220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2640, partial_loss/deprel_loss: 0.4431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5460, loss: 0.8125, batch_reg_loss: 0.1388, reg_loss: 0.1382 ||:  67%|######7   | 64/95 [00:46<00:22,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9360, LAS: 0.8814, UEM: 0.5732, LEM: 0.3361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4190, partial_loss/deprel_loss: 0.5727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6808, loss: 0.8043, batch_reg_loss: 0.1388, reg_loss: 0.1382 ||:  71%|#######   | 67/95 [00:48<00:21,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9370, LAS: 0.8826, UEM: 0.5785, LEM: 0.3382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3167, partial_loss/deprel_loss: 0.4821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5879, loss: 0.7951, batch_reg_loss: 0.1389, reg_loss: 0.1382 ||:  74%|#######3  | 70/95 [00:50<00:18,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9369, LAS: 0.8826, UEM: 0.5706, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6230, partial_loss/deprel_loss: 0.6653, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7957, loss: 0.7966, batch_reg_loss: 0.1389, reg_loss: 0.1383 ||:  78%|#######7  | 74/95 [00:53<00:14,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8875, UAS: 0.9375, LAS: 0.8832, UEM: 0.5774, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4835, partial_loss/deprel_loss: 0.6329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7420, loss: 0.7910, batch_reg_loss: 0.1390, reg_loss: 0.1383 ||:  81%|########1 | 77/95 [00:55<00:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9379, LAS: 0.8836, UEM: 0.5761, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4014, partial_loss/deprel_loss: 0.5538, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6624, loss: 0.7882, batch_reg_loss: 0.1390, reg_loss: 0.1383 ||:  84%|########4 | 80/95 [00:58<00:11,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9377, LAS: 0.8832, UEM: 0.5691, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4996, partial_loss/deprel_loss: 0.6721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7767, loss: 0.7916, batch_reg_loss: 0.1391, reg_loss: 0.1383 ||:  87%|########7 | 83/95 [01:00<00:08,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9374, LAS: 0.8828, UEM: 0.5665, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4622, partial_loss/deprel_loss: 0.5718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6890, loss: 0.7948, batch_reg_loss: 0.1391, reg_loss: 0.1384 ||:  91%|######### | 86/95 [01:02<00:06,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9382, LAS: 0.8835, UEM: 0.5720, LEM: 0.3273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1930, partial_loss/deprel_loss: 0.4435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5326, loss: 0.7901, batch_reg_loss: 0.1392, reg_loss: 0.1384 ||:  95%|#########4| 90/95 [01:04<00:03,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9367, LAS: 0.8818, UEM: 0.5672, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5604, partial_loss/deprel_loss: 0.7168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8248, loss: 0.8043, batch_reg_loss: 0.1393, reg_loss: 0.1384 ||:  98%|#########7| 93/95 [01:07<00:01,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8415, UAS: 0.9359, LAS: 0.8809, UEM: 0.5622, LEM: 0.3202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0151, partial_loss/deprel_loss: 0.9374, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0923, loss: 0.8117, batch_reg_loss: 0.1393, reg_loss: 0.1385 ||: 100%|##########| 95/95 [01:08<00:00,  1.39it/s]\n",
+      "2023-04-06 23:42:46,421 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:42:46,421 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.138  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - UEM                      |     0.562  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - LEM                      |     0.320  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - EM                       |     0.841  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.015  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - UAS                      |     0.936  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.937  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - loss                     |     0.812  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - LAS                      |     0.881  |       N/A\n",
+      "2023-04-06 23:42:46,422 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:42:46,423 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:42:46,423 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:42:46,423 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:42:46,423 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:42:46,423 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:42:46,423 - INFO - combo.training.trainer - Epoch duration: 0:01:08.532568\n",
+      "2023-04-06 23:42:46,424 - INFO - combo.training.trainer - Estimated training time remaining: 6:39:20\n",
+      "2023-04-06 23:42:46,424 - INFO - allennlp.training.trainer - Epoch 47/399\n",
+      "2023-04-06 23:42:46,424 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:42:46,424 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:42:46,431 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9575, LAS: 0.9058, UEM: 0.6646, LEM: 0.3678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2918, partial_loss/deprel_loss: 0.5193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6131, loss: 0.6360, batch_reg_loss: 0.1394, reg_loss: 0.1393 ||:   4%|4         | 4/95 [00:02<00:59,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8759, UAS: 0.9441, LAS: 0.8906, UEM: 0.5665, LEM: 0.2927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7484, partial_loss/deprel_loss: 0.6631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8196, loss: 0.7513, batch_reg_loss: 0.1394, reg_loss: 0.1394 ||:   7%|7         | 7/95 [00:04<00:59,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9357, LAS: 0.8795, UEM: 0.5114, LEM: 0.2450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7294, partial_loss/deprel_loss: 0.8087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9323, loss: 0.8303, batch_reg_loss: 0.1395, reg_loss: 0.1394 ||:  11%|#         | 10/95 [00:06<00:57,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9358, LAS: 0.8801, UEM: 0.5003, LEM: 0.2286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4632, partial_loss/deprel_loss: 0.5388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6632, loss: 0.8273, batch_reg_loss: 0.1396, reg_loss: 0.1394 ||:  15%|#4        | 14/95 [00:09<00:53,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8491, UAS: 0.9353, LAS: 0.8802, UEM: 0.5093, LEM: 0.2462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9208, partial_loss/deprel_loss: 0.8924, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0377, loss: 0.8179, batch_reg_loss: 0.1396, reg_loss: 0.1395 ||:  18%|#7        | 17/95 [00:11<00:52,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9352, LAS: 0.8805, UEM: 0.5340, LEM: 0.2827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1473, partial_loss/deprel_loss: 0.3474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4471, loss: 0.8197, batch_reg_loss: 0.1397, reg_loss: 0.1395 ||:  21%|##1       | 20/95 [00:13<00:50,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9339, LAS: 0.8791, UEM: 0.5085, LEM: 0.2634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6413, partial_loss/deprel_loss: 0.7258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8486, loss: 0.8335, batch_reg_loss: 0.1397, reg_loss: 0.1395 ||:  24%|##4       | 23/95 [00:15<00:48,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9361, LAS: 0.8817, UEM: 0.5197, LEM: 0.2742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2100, partial_loss/deprel_loss: 0.3856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4903, loss: 0.8120, batch_reg_loss: 0.1398, reg_loss: 0.1396 ||:  28%|##8       | 27/95 [00:17<00:44,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9333, LAS: 0.8783, UEM: 0.5124, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2833, partial_loss/deprel_loss: 0.4738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5756, loss: 0.8371, batch_reg_loss: 0.1399, reg_loss: 0.1396 ||:  33%|###2      | 31/95 [00:20<00:42,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9354, LAS: 0.8807, UEM: 0.5301, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3344, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6285, loss: 0.8172, batch_reg_loss: 0.1400, reg_loss: 0.1396 ||:  36%|###5      | 34/95 [00:22<00:40,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9624, UAS: 0.9366, LAS: 0.8821, UEM: 0.5833, LEM: 0.3462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0444, partial_loss/deprel_loss: 0.1539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2721, loss: 0.8122, batch_reg_loss: 0.1400, reg_loss: 0.1397 ||:  40%|####      | 38/95 [00:25<00:39,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9361, LAS: 0.8817, UEM: 0.5872, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5172, partial_loss/deprel_loss: 0.6677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7777, loss: 0.8153, batch_reg_loss: 0.1401, reg_loss: 0.1397 ||:  43%|####3     | 41/95 [00:27<00:38,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9361, LAS: 0.8814, UEM: 0.5756, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5892, partial_loss/deprel_loss: 0.6801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8021, loss: 0.8151, batch_reg_loss: 0.1401, reg_loss: 0.1397 ||:  46%|####6     | 44/95 [00:30<00:35,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9373, LAS: 0.8827, UEM: 0.5772, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4436, partial_loss/deprel_loss: 0.5806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6934, loss: 0.8048, batch_reg_loss: 0.1402, reg_loss: 0.1398 ||:  49%|####9     | 47/95 [00:32<00:34,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9379, LAS: 0.8836, UEM: 0.5798, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9289, partial_loss/deprel_loss: 0.8450, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0020, loss: 0.7981, batch_reg_loss: 0.1403, reg_loss: 0.1398 ||:  53%|#####2    | 50/95 [00:34<00:32,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9365, LAS: 0.8819, UEM: 0.5754, LEM: 0.3300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3637, partial_loss/deprel_loss: 0.6077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6992, loss: 0.8102, batch_reg_loss: 0.1403, reg_loss: 0.1398 ||:  57%|#####6    | 54/95 [00:37<00:28,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9375, LAS: 0.8828, UEM: 0.5777, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3133, partial_loss/deprel_loss: 0.5667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6564, loss: 0.8034, batch_reg_loss: 0.1404, reg_loss: 0.1399 ||:  60%|######    | 57/95 [00:39<00:27,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.9369, LAS: 0.8822, UEM: 0.5702, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8833, partial_loss/deprel_loss: 0.8060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9619, loss: 0.8088, batch_reg_loss: 0.1404, reg_loss: 0.1399 ||:  63%|######3   | 60/95 [00:41<00:25,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9369, LAS: 0.8819, UEM: 0.5634, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5471, partial_loss/deprel_loss: 0.8084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8966, loss: 0.8110, batch_reg_loss: 0.1405, reg_loss: 0.1399 ||:  66%|######6   | 63/95 [00:43<00:23,  1.37it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9372, LAS: 0.8823, UEM: 0.5600, LEM: 0.3102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5296, partial_loss/deprel_loss: 0.6012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7274, loss: 0.8069, batch_reg_loss: 0.1405, reg_loss: 0.1399 ||:  71%|#######   | 67/95 [00:46<00:19,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9369, LAS: 0.8821, UEM: 0.5693, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4940, partial_loss/deprel_loss: 0.6594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7669, loss: 0.8081, batch_reg_loss: 0.1406, reg_loss: 0.1400 ||:  74%|#######3  | 70/95 [00:48<00:17,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9382, LAS: 0.8836, UEM: 0.5848, LEM: 0.3365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1530, partial_loss/deprel_loss: 0.3817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4766, loss: 0.7969, batch_reg_loss: 0.1407, reg_loss: 0.1400 ||:  77%|#######6  | 73/95 [00:51<00:16,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8283, UAS: 0.9379, LAS: 0.8833, UEM: 0.5780, LEM: 0.3291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2605, partial_loss/deprel_loss: 1.0438, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2278, loss: 0.7990, batch_reg_loss: 0.1407, reg_loss: 0.1400 ||:  81%|########1 | 77/95 [00:53<00:12,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9381, LAS: 0.8834, UEM: 0.5851, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2065, partial_loss/deprel_loss: 0.4362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5310, loss: 0.7956, batch_reg_loss: 0.1408, reg_loss: 0.1401 ||:  84%|########4 | 80/95 [00:55<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9380, LAS: 0.8832, UEM: 0.5787, LEM: 0.3285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3494, partial_loss/deprel_loss: 0.4998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6105, loss: 0.7982, batch_reg_loss: 0.1408, reg_loss: 0.1401 ||:  88%|########8 | 84/95 [00:57<00:07,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9373, LAS: 0.8823, UEM: 0.5795, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1643, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4497, loss: 0.8058, batch_reg_loss: 0.1409, reg_loss: 0.1401 ||:  93%|#########2| 88/95 [01:00<00:04,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9373, LAS: 0.8821, UEM: 0.5728, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5563, partial_loss/deprel_loss: 0.6610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7810, loss: 0.8073, batch_reg_loss: 0.1410, reg_loss: 0.1402 ||:  97%|#########6| 92/95 [01:02<00:01,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9364, LAS: 0.8810, UEM: 0.5686, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.5893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6867, loss: 0.8150, batch_reg_loss: 0.1410, reg_loss: 0.1402 ||: 100%|##########| 95/95 [01:03<00:00,  1.48it/s]\n",
+      "2023-04-06 23:43:50,414 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.140  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - UEM                      |     0.569  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - LEM                      |     0.322  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - EM                       |     0.890  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.371  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - UAS                      |     0.936  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.589  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - loss                     |     0.815  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - LAS                      |     0.881  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:43:50,415 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:43:50,416 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:43:50,416 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:43:50,416 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:43:50,416 - INFO - combo.training.trainer - Epoch duration: 0:01:03.992550\n",
+      "2023-04-06 23:43:50,416 - INFO - combo.training.trainer - Estimated training time remaining: 6:37:44\n",
+      "2023-04-06 23:43:50,416 - INFO - allennlp.training.trainer - Epoch 48/399\n",
+      "2023-04-06 23:43:50,416 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:43:50,417 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:43:50,430 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9246, LAS: 0.8706, UEM: 0.3107, LEM: 0.1247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4508, partial_loss/deprel_loss: 0.6146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7229, loss: 0.8960, batch_reg_loss: 0.1411, reg_loss: 0.1411 ||:   4%|4         | 4/95 [00:02<00:53,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9396, LAS: 0.8903, UEM: 0.6835, LEM: 0.5249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0651, partial_loss/deprel_loss: 0.1912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3071, loss: 0.7490, batch_reg_loss: 0.1411, reg_loss: 0.1411 ||:   6%|6         | 6/95 [00:04<01:04,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9430, LAS: 0.8921, UEM: 0.6491, LEM: 0.4458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3176, partial_loss/deprel_loss: 0.5263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6257, loss: 0.7309, batch_reg_loss: 0.1412, reg_loss: 0.1411 ||:   9%|9         | 9/95 [00:06<01:04,  1.34it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9407, LAS: 0.8877, UEM: 0.6194, LEM: 0.4118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0302, partial_loss/deprel_loss: 0.9679, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1216, loss: 0.7598, batch_reg_loss: 0.1412, reg_loss: 0.1411 ||:  13%|#2        | 12/95 [00:09<01:01,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9411, LAS: 0.8879, UEM: 0.6232, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2766, partial_loss/deprel_loss: 0.4543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5601, loss: 0.7571, batch_reg_loss: 0.1413, reg_loss: 0.1412 ||:  16%|#5        | 15/95 [00:11<01:00,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9362, LAS: 0.8814, UEM: 0.5813, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5272, partial_loss/deprel_loss: 0.6339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7539, loss: 0.8038, batch_reg_loss: 0.1414, reg_loss: 0.1412 ||:  20%|##        | 19/95 [00:13<00:54,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9384, LAS: 0.8840, UEM: 0.5813, LEM: 0.3491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6809, partial_loss/deprel_loss: 0.7209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8544, loss: 0.7911, batch_reg_loss: 0.1414, reg_loss: 0.1412 ||:  23%|##3       | 22/95 [00:15<00:51,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9348, LAS: 0.8805, UEM: 0.5621, LEM: 0.3311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5691, partial_loss/deprel_loss: 0.7029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8176, loss: 0.8155, batch_reg_loss: 0.1415, reg_loss: 0.1413 ||:  27%|##7       | 26/95 [00:18<00:48,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8847, UAS: 0.9332, LAS: 0.8784, UEM: 0.5724, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4915, partial_loss/deprel_loss: 0.6467, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7572, loss: 0.8279, batch_reg_loss: 0.1416, reg_loss: 0.1413 ||:  31%|###       | 29/95 [00:20<00:47,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8625, UAS: 0.9330, LAS: 0.8774, UEM: 0.5595, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6215, partial_loss/deprel_loss: 0.8165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9192, loss: 0.8350, batch_reg_loss: 0.1416, reg_loss: 0.1413 ||:  34%|###3      | 32/95 [00:22<00:44,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9348, LAS: 0.8798, UEM: 0.5804, LEM: 0.3409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7149, partial_loss/deprel_loss: 0.8073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9305, loss: 0.8176, batch_reg_loss: 0.1417, reg_loss: 0.1414 ||:  37%|###6      | 35/95 [00:25<00:42,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8580, UAS: 0.9340, LAS: 0.8788, UEM: 0.5589, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0087, partial_loss/deprel_loss: 0.8536, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0264, loss: 0.8281, batch_reg_loss: 0.1418, reg_loss: 0.1414 ||:  41%|####1     | 39/95 [00:27<00:37,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9362, LAS: 0.8813, UEM: 0.5820, LEM: 0.3414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2104, partial_loss/deprel_loss: 0.3947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4997, loss: 0.8080, batch_reg_loss: 0.1418, reg_loss: 0.1414 ||:  44%|####4     | 42/95 [00:29<00:36,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8371, UAS: 0.9346, LAS: 0.8795, UEM: 0.5668, LEM: 0.3294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3684, partial_loss/deprel_loss: 0.9809, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2003, loss: 0.8222, batch_reg_loss: 0.1419, reg_loss: 0.1415 ||:  48%|####8     | 46/95 [00:32<00:33,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8141, UAS: 0.9333, LAS: 0.8780, UEM: 0.5536, LEM: 0.3186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3576, partial_loss/deprel_loss: 0.9825, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1995, loss: 0.8312, batch_reg_loss: 0.1420, reg_loss: 0.1415 ||:  53%|#####2    | 50/95 [00:34<00:29,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.9332, LAS: 0.8779, UEM: 0.5417, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9766, partial_loss/deprel_loss: 0.8796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0411, loss: 0.8334, batch_reg_loss: 0.1420, reg_loss: 0.1415 ||:  57%|#####6    | 54/95 [00:37<00:26,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9322, LAS: 0.8768, UEM: 0.5268, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7397, partial_loss/deprel_loss: 0.7262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8710, loss: 0.8443, batch_reg_loss: 0.1421, reg_loss: 0.1416 ||:  61%|######1   | 58/95 [00:39<00:23,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8496, UAS: 0.9325, LAS: 0.8768, UEM: 0.5299, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9624, partial_loss/deprel_loss: 0.8780, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0370, loss: 0.8424, batch_reg_loss: 0.1422, reg_loss: 0.1416 ||:  65%|######5   | 62/95 [00:42<00:22,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9343, LAS: 0.8788, UEM: 0.5502, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3150, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5813, loss: 0.8254, batch_reg_loss: 0.1423, reg_loss: 0.1417 ||:  69%|######9   | 66/95 [00:45<00:19,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9346, LAS: 0.8791, UEM: 0.5491, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9794, partial_loss/deprel_loss: 0.8978, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0565, loss: 0.8239, batch_reg_loss: 0.1424, reg_loss: 0.1417 ||:  74%|#######3  | 70/95 [00:47<00:16,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9351, LAS: 0.8797, UEM: 0.5488, LEM: 0.3082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6549, partial_loss/deprel_loss: 0.6211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7703, loss: 0.8183, batch_reg_loss: 0.1424, reg_loss: 0.1417 ||:  78%|#######7  | 74/95 [00:51<00:14,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9350, LAS: 0.8797, UEM: 0.5482, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3373, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6150, loss: 0.8187, batch_reg_loss: 0.1425, reg_loss: 0.1418 ||:  81%|########1 | 77/95 [00:53<00:12,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9360, LAS: 0.8810, UEM: 0.5638, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1284, partial_loss/deprel_loss: 0.2522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3700, loss: 0.8082, batch_reg_loss: 0.1425, reg_loss: 0.1418 ||:  84%|########4 | 80/95 [00:55<00:10,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9360, LAS: 0.8809, UEM: 0.5696, LEM: 0.3311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1299, partial_loss/deprel_loss: 0.3227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4267, loss: 0.8099, batch_reg_loss: 0.1426, reg_loss: 0.1418 ||:  87%|########7 | 83/95 [00:57<00:08,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9364, LAS: 0.8812, UEM: 0.5652, LEM: 0.3244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5604, partial_loss/deprel_loss: 0.6542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7781, loss: 0.8085, batch_reg_loss: 0.1426, reg_loss: 0.1419 ||:  92%|#########1| 87/95 [00:59<00:05,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8426, UAS: 0.9360, LAS: 0.8808, UEM: 0.5644, LEM: 0.3241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1008, partial_loss/deprel_loss: 0.9605, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1313, loss: 0.8109, batch_reg_loss: 0.1427, reg_loss: 0.1419 ||:  95%|#########4| 90/95 [01:02<00:03,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9366, LAS: 0.8813, UEM: 0.5658, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7521, partial_loss/deprel_loss: 0.8806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9976, loss: 0.8087, batch_reg_loss: 0.1428, reg_loss: 0.1419 ||:  99%|#########8| 94/95 [01:04<00:00,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8473, UAS: 0.9362, LAS: 0.8809, UEM: 0.5632, LEM: 0.3208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0050, partial_loss/deprel_loss: 0.9152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0759, loss: 0.8115, batch_reg_loss: 0.1428, reg_loss: 0.1419 ||: 100%|##########| 95/95 [01:04<00:00,  1.47it/s]\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.142  |       N/A\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - UEM                      |     0.563  |       N/A\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - LEM                      |     0.321  |       N/A\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - EM                       |     0.847  |       N/A\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.005  |       N/A\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - UAS                      |     0.936  |       N/A\n",
+      "2023-04-06 23:44:55,054 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.915  |       N/A\n",
+      "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - loss                     |     0.811  |       N/A\n",
+      "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - LAS                      |     0.881  |       N/A\n",
+      "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:44:55,055 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:44:55,056 - INFO - combo.training.trainer - Epoch duration: 0:01:04.639291\n",
+      "2023-04-06 23:44:55,056 - INFO - combo.training.trainer - Estimated training time remaining: 6:36:13\n",
+      "2023-04-06 23:44:55,056 - INFO - allennlp.training.trainer - Epoch 49/399\n",
+      "2023-04-06 23:44:55,056 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:44:55,056 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:44:55,062 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9468, LAS: 0.8951, UEM: 0.5605, LEM: 0.2780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8158, partial_loss/deprel_loss: 0.8483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9846, loss: 0.7297, batch_reg_loss: 0.1428, reg_loss: 0.1428 ||:   4%|4         | 4/95 [00:02<00:46,  1.94it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9492, LAS: 0.8979, UEM: 0.6192, LEM: 0.3542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2337, partial_loss/deprel_loss: 0.4015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5108, loss: 0.6914, batch_reg_loss: 0.1429, reg_loss: 0.1428 ||:   7%|7         | 7/95 [00:04<00:52,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9468, LAS: 0.8960, UEM: 0.6436, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1523, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4043, loss: 0.7006, batch_reg_loss: 0.1429, reg_loss: 0.1429 ||:  11%|#         | 10/95 [00:06<00:56,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9431, LAS: 0.8893, UEM: 0.5835, LEM: 0.3360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4091, partial_loss/deprel_loss: 0.6584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7515, loss: 0.7444, batch_reg_loss: 0.1430, reg_loss: 0.1429 ||:  15%|#4        | 14/95 [00:09<00:51,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8678, UAS: 0.9415, LAS: 0.8879, UEM: 0.5673, LEM: 0.3210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6671, partial_loss/deprel_loss: 0.6714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8136, loss: 0.7581, batch_reg_loss: 0.1431, reg_loss: 0.1429 ||:  19%|#8        | 18/95 [00:11<00:47,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8277, UAS: 0.9393, LAS: 0.8853, UEM: 0.5465, LEM: 0.3020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3672, partial_loss/deprel_loss: 1.0111, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2254, loss: 0.7825, batch_reg_loss: 0.1431, reg_loss: 0.1430 ||:  22%|##2       | 21/95 [00:13<00:47,  1.57it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9398, LAS: 0.8865, UEM: 0.5490, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2423, partial_loss/deprel_loss: 0.8838, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0987, loss: 0.7780, batch_reg_loss: 0.1432, reg_loss: 0.1430 ||:  26%|##6       | 25/95 [00:16<00:45,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8591, UAS: 0.9369, LAS: 0.8828, UEM: 0.5379, LEM: 0.2909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7318, partial_loss/deprel_loss: 0.8710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9864, loss: 0.8033, batch_reg_loss: 0.1433, reg_loss: 0.1430 ||:  29%|##9       | 28/95 [00:18<00:44,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9374, LAS: 0.8834, UEM: 0.5485, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1769, partial_loss/deprel_loss: 0.9157, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1113, loss: 0.7973, batch_reg_loss: 0.1433, reg_loss: 0.1430 ||:  33%|###2      | 31/95 [00:20<00:43,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9366, LAS: 0.8823, UEM: 0.5334, LEM: 0.2852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5307, partial_loss/deprel_loss: 0.6811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7944, loss: 0.8072, batch_reg_loss: 0.1434, reg_loss: 0.1431 ||:  36%|###5      | 34/95 [00:22<00:42,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9372, LAS: 0.8830, UEM: 0.5274, LEM: 0.2795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4577, partial_loss/deprel_loss: 0.5830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7013, loss: 0.8014, batch_reg_loss: 0.1434, reg_loss: 0.1431 ||:  39%|###8      | 37/95 [00:24<00:40,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9367, LAS: 0.8823, UEM: 0.5204, LEM: 0.2730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6713, partial_loss/deprel_loss: 0.7439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8729, loss: 0.8124, batch_reg_loss: 0.1435, reg_loss: 0.1431 ||:  42%|####2     | 40/95 [00:26<00:38,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9368, LAS: 0.8824, UEM: 0.5301, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1867, partial_loss/deprel_loss: 0.4327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5271, loss: 0.8118, batch_reg_loss: 0.1436, reg_loss: 0.1432 ||:  46%|####6     | 44/95 [00:29<00:34,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9372, LAS: 0.8830, UEM: 0.5267, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3491, partial_loss/deprel_loss: 0.5682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6680, loss: 0.8096, batch_reg_loss: 0.1436, reg_loss: 0.1432 ||:  51%|#####     | 48/95 [00:31<00:31,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8034, UAS: 0.9359, LAS: 0.8816, UEM: 0.5234, LEM: 0.2767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6888, partial_loss/deprel_loss: 1.1994, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4410, loss: 0.8214, batch_reg_loss: 0.1437, reg_loss: 0.1432 ||:  54%|#####3    | 51/95 [00:33<00:29,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9366, LAS: 0.8824, UEM: 0.5644, LEM: 0.3270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0663, partial_loss/deprel_loss: 0.1810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3018, loss: 0.8144, batch_reg_loss: 0.1437, reg_loss: 0.1433 ||:  57%|#####6    | 54/95 [00:36<00:29,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9368, LAS: 0.8822, UEM: 0.5618, LEM: 0.3219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3877, partial_loss/deprel_loss: 0.5460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6581, loss: 0.8138, batch_reg_loss: 0.1438, reg_loss: 0.1433 ||:  60%|######    | 57/95 [00:38<00:26,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9355, LAS: 0.8809, UEM: 0.5548, LEM: 0.3172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2272, partial_loss/deprel_loss: 0.4428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5435, loss: 0.8239, batch_reg_loss: 0.1439, reg_loss: 0.1433 ||:  64%|######4   | 61/95 [00:40<00:23,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9361, LAS: 0.8814, UEM: 0.5611, LEM: 0.3194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3078, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6117, loss: 0.8197, batch_reg_loss: 0.1439, reg_loss: 0.1433 ||:  67%|######7   | 64/95 [00:43<00:21,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9364, LAS: 0.8815, UEM: 0.5533, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7052, partial_loss/deprel_loss: 0.7890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9162, loss: 0.8203, batch_reg_loss: 0.1440, reg_loss: 0.1434 ||:  72%|#######1  | 68/95 [00:45<00:18,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8378, UAS: 0.9355, LAS: 0.8806, UEM: 0.5464, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3218, partial_loss/deprel_loss: 0.9959, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2051, loss: 0.8276, batch_reg_loss: 0.1441, reg_loss: 0.1434 ||:  76%|#######5  | 72/95 [00:48<00:15,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9365, LAS: 0.8817, UEM: 0.5571, LEM: 0.3135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5070, partial_loss/deprel_loss: 0.6505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7659, loss: 0.8192, batch_reg_loss: 0.1441, reg_loss: 0.1434 ||:  79%|#######8  | 75/95 [00:50<00:14,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9368, LAS: 0.8820, UEM: 0.5578, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3250, partial_loss/deprel_loss: 0.5083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6158, loss: 0.8165, batch_reg_loss: 0.1442, reg_loss: 0.1435 ||:  82%|########2 | 78/95 [00:52<00:12,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9365, LAS: 0.8816, UEM: 0.5566, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2677, partial_loss/deprel_loss: 0.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5191, loss: 0.8171, batch_reg_loss: 0.1442, reg_loss: 0.1435 ||:  85%|########5 | 81/95 [00:55<00:10,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9363, LAS: 0.8815, UEM: 0.5511, LEM: 0.3080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4442, partial_loss/deprel_loss: 0.5221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.8182, batch_reg_loss: 0.1443, reg_loss: 0.1435 ||:  89%|########9 | 85/95 [00:57<00:07,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9373, LAS: 0.8828, UEM: 0.5726, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1108, partial_loss/deprel_loss: 0.2497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3663, loss: 0.8079, batch_reg_loss: 0.1444, reg_loss: 0.1436 ||:  93%|#########2| 88/95 [01:00<00:05,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9376, LAS: 0.8832, UEM: 0.5692, LEM: 0.3286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4735, partial_loss/deprel_loss: 0.5673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6930, loss: 0.8064, batch_reg_loss: 0.1444, reg_loss: 0.1436 ||:  97%|#########6| 92/95 [01:02<00:02,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9378, LAS: 0.8832, UEM: 0.5714, LEM: 0.3296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5080, partial_loss/deprel_loss: 0.6464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7632, loss: 0.8066, batch_reg_loss: 0.1445, reg_loss: 0.1436 ||: 100%|##########| 95/95 [01:04<00:00,  1.46it/s]\n",
+      "2023-04-06 23:45:59,939 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:45:59,939 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:45:59,939 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.144  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - UEM                      |     0.571  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - LEM                      |     0.330  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - EM                       |     0.888  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.508  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - UAS                      |     0.938  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.646  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - loss                     |     0.807  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - LAS                      |     0.883  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:45:59,940 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:45:59,941 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:45:59,941 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:45:59,941 - INFO - combo.training.trainer - Epoch duration: 0:01:04.885191\n",
+      "2023-04-06 23:45:59,941 - INFO - combo.training.trainer - Estimated training time remaining: 6:34:46\n",
+      "2023-04-06 23:45:59,941 - INFO - allennlp.training.trainer - Epoch 50/399\n",
+      "2023-04-06 23:45:59,941 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:45:59,942 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:45:59,947 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9078, LAS: 0.8507, UEM: 0.3908, LEM: 0.1523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5539, partial_loss/deprel_loss: 0.6880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8057, loss: 1.0078, batch_reg_loss: 0.1445, reg_loss: 0.1445 ||:   3%|3         | 3/95 [00:02<01:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9317, LAS: 0.8766, UEM: 0.5551, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4512, partial_loss/deprel_loss: 0.6208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7314, loss: 0.8406, batch_reg_loss: 0.1446, reg_loss: 0.1445 ||:   6%|6         | 6/95 [00:04<01:01,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8013, UAS: 0.9265, LAS: 0.8697, UEM: 0.5033, LEM: 0.2321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7658, partial_loss/deprel_loss: 1.1443, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4133, loss: 0.8956, batch_reg_loss: 0.1446, reg_loss: 0.1446 ||:  11%|#         | 10/95 [00:06<00:56,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9341, LAS: 0.8794, UEM: 0.5481, LEM: 0.2683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3290, partial_loss/deprel_loss: 0.5131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6209, loss: 0.8274, batch_reg_loss: 0.1447, reg_loss: 0.1446 ||:  14%|#3        | 13/95 [00:09<00:59,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9374, LAS: 0.8833, UEM: 0.5741, LEM: 0.2911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2631, partial_loss/deprel_loss: 0.4149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5293, loss: 0.7962, batch_reg_loss: 0.1448, reg_loss: 0.1446 ||:  17%|#6        | 16/95 [00:11<01:00,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9353, LAS: 0.8816, UEM: 0.5744, LEM: 0.3010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7819, partial_loss/deprel_loss: 0.7879, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9315, loss: 0.8111, batch_reg_loss: 0.1448, reg_loss: 0.1446 ||:  20%|##        | 19/95 [00:14<00:58,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8510, UAS: 0.9337, LAS: 0.8794, UEM: 0.5620, LEM: 0.2932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0534, partial_loss/deprel_loss: 0.9259, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0962, loss: 0.8336, batch_reg_loss: 0.1449, reg_loss: 0.1447 ||:  23%|##3       | 22/95 [00:16<00:54,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9366, LAS: 0.8828, UEM: 0.5983, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1763, partial_loss/deprel_loss: 0.3904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4925, loss: 0.8100, batch_reg_loss: 0.1449, reg_loss: 0.1447 ||:  26%|##6       | 25/95 [00:18<00:53,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8514, UAS: 0.9354, LAS: 0.8810, UEM: 0.5727, LEM: 0.3118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8617, partial_loss/deprel_loss: 0.8764, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0185, loss: 0.8204, batch_reg_loss: 0.1450, reg_loss: 0.1447 ||:  31%|###       | 29/95 [00:21<00:47,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9376, LAS: 0.8837, UEM: 0.5951, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1037, partial_loss/deprel_loss: 0.2590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3730, loss: 0.7973, batch_reg_loss: 0.1451, reg_loss: 0.1448 ||:  35%|###4      | 33/95 [00:23<00:44,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8823, UAS: 0.9367, LAS: 0.8824, UEM: 0.5756, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6670, partial_loss/deprel_loss: 0.6741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8178, loss: 0.8089, batch_reg_loss: 0.1451, reg_loss: 0.1448 ||:  38%|###7      | 36/95 [00:25<00:41,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9375, LAS: 0.8833, UEM: 0.5715, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3772, partial_loss/deprel_loss: 0.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6379, loss: 0.8022, batch_reg_loss: 0.1452, reg_loss: 0.1448 ||:  41%|####1     | 39/95 [00:27<00:39,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9368, LAS: 0.8828, UEM: 0.5804, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1168, partial_loss/deprel_loss: 0.3273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4304, loss: 0.8037, batch_reg_loss: 0.1452, reg_loss: 0.1449 ||:  44%|####4     | 42/95 [00:30<00:37,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9351, LAS: 0.8807, UEM: 0.5662, LEM: 0.3249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5921, partial_loss/deprel_loss: 0.7327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8499, loss: 0.8204, batch_reg_loss: 0.1453, reg_loss: 0.1449 ||:  47%|####7     | 45/95 [00:32<00:35,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9360, LAS: 0.8817, UEM: 0.5692, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4875, partial_loss/deprel_loss: 0.6497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7626, loss: 0.8124, batch_reg_loss: 0.1453, reg_loss: 0.1449 ||:  51%|#####     | 48/95 [00:34<00:33,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9346, LAS: 0.8800, UEM: 0.5626, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2597, partial_loss/deprel_loss: 0.4557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5619, loss: 0.8267, batch_reg_loss: 0.1454, reg_loss: 0.1449 ||:  55%|#####4    | 52/95 [00:37<00:30,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8542, UAS: 0.9348, LAS: 0.8800, UEM: 0.5570, LEM: 0.3149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8865, partial_loss/deprel_loss: 0.8319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9883, loss: 0.8266, batch_reg_loss: 0.1455, reg_loss: 0.1450 ||:  58%|#####7    | 55/95 [00:39<00:28,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9349, LAS: 0.8801, UEM: 0.5596, LEM: 0.3156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3515, partial_loss/deprel_loss: 0.5473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6537, loss: 0.8267, batch_reg_loss: 0.1455, reg_loss: 0.1450 ||:  61%|######1   | 58/95 [00:41<00:27,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9346, LAS: 0.8797, UEM: 0.5508, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0865, partial_loss/deprel_loss: 0.9012, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0839, loss: 0.8320, batch_reg_loss: 0.1456, reg_loss: 0.1450 ||:  65%|######5   | 62/95 [00:43<00:22,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9355, LAS: 0.8809, UEM: 0.5603, LEM: 0.3137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.3913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5063, loss: 0.8214, batch_reg_loss: 0.1457, reg_loss: 0.1451 ||:  69%|######9   | 66/95 [00:46<00:19,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9361, LAS: 0.8818, UEM: 0.5629, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7719, partial_loss/deprel_loss: 0.7586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9070, loss: 0.8146, batch_reg_loss: 0.1458, reg_loss: 0.1451 ||:  74%|#######3  | 70/95 [00:49<00:16,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9361, LAS: 0.8819, UEM: 0.5576, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4729, partial_loss/deprel_loss: 0.5808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7050, loss: 0.8139, batch_reg_loss: 0.1458, reg_loss: 0.1452 ||:  78%|#######7  | 74/95 [00:51<00:13,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8327, UAS: 0.9368, LAS: 0.8829, UEM: 0.5771, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1562, partial_loss/deprel_loss: 1.0269, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1986, loss: 0.8075, batch_reg_loss: 0.1459, reg_loss: 0.1452 ||:  82%|########2 | 78/95 [00:54<00:12,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8208, UAS: 0.9364, LAS: 0.8823, UEM: 0.5720, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4516, partial_loss/deprel_loss: 1.0691, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2915, loss: 0.8112, batch_reg_loss: 0.1459, reg_loss: 0.1452 ||:  86%|########6 | 82/95 [00:57<00:08,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9366, LAS: 0.8825, UEM: 0.5678, LEM: 0.3253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5063, partial_loss/deprel_loss: 0.6596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7750, loss: 0.8109, batch_reg_loss: 0.1460, reg_loss: 0.1452 ||:  89%|########9 | 85/95 [00:59<00:06,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9374, LAS: 0.8832, UEM: 0.5746, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1837, partial_loss/deprel_loss: 0.3435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4576, loss: 0.8052, batch_reg_loss: 0.1460, reg_loss: 0.1453 ||:  93%|#########2| 88/95 [01:01<00:04,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8544, UAS: 0.9378, LAS: 0.8836, UEM: 0.5769, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7352, partial_loss/deprel_loss: 0.9154, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0254, loss: 0.8025, batch_reg_loss: 0.1461, reg_loss: 0.1453 ||:  96%|#########5| 91/95 [01:03<00:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9377, LAS: 0.8833, UEM: 0.5734, LEM: 0.3270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7321, partial_loss/deprel_loss: 0.7708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9092, loss: 0.8052, batch_reg_loss: 0.1462, reg_loss: 0.1453 ||: 100%|##########| 95/95 [01:06<00:00,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9377, LAS: 0.8833, UEM: 0.5734, LEM: 0.3270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7321, partial_loss/deprel_loss: 0.7708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9092, loss: 0.8052, batch_reg_loss: 0.1462, reg_loss: 0.1453 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-06 23:47:06,372 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8985, UAS: 0.9566, LAS: 0.9018, UEM: 0.7797, LEM: 0.5207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4264, partial_loss/deprel_loss: 29.7159, partial_loss/cycle_loss: 0.0000, batch_loss: 23.8580, loss: 25.5143, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:07,  1.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8784, UAS: 0.9567, LAS: 0.9029, UEM: 0.7585, LEM: 0.4904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8997, partial_loss/deprel_loss: 34.5766, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8412, loss: 24.5860, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:05,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9503, LAS: 0.8962, UEM: 0.6993, LEM: 0.4292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9073, partial_loss/deprel_loss: 29.4189, partial_loss/cycle_loss: 0.0000, batch_loss: 23.7166, loss: 25.8269, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:07<00:02,  1.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9473, LAS: 0.8931, UEM: 0.6718, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3101, partial_loss/deprel_loss: 28.6903, partial_loss/cycle_loss: 0.0000, batch_loss: 23.0143, loss: 27.0167, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9473, LAS: 0.8931, UEM: 0.6718, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3101, partial_loss/deprel_loss: 28.6903, partial_loss/cycle_loss: 0.0000, batch_loss: 23.0143, loss: 27.0167, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00,  1.10it/s]\n",
+      "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.145  |     0.000\n",
+      "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - UEM                      |     0.573  |     0.672\n",
+      "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - LEM                      |     0.327  |     0.394\n",
+      "2023-04-06 23:47:16,340 - INFO - combo.training.tensorboard_writer - EM                       |     0.868  |     0.922\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.732  |     0.310\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - UAS                      |     0.938  |     0.947\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.771  |    28.690\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - loss                     |     0.805  |    27.017\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - LAS                      |     0.883  |     0.893\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:47:16,341 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:47:16,342 - INFO - combo.training.trainer - Epoch duration: 0:01:16.400613\n",
+      "2023-04-06 23:47:16,342 - INFO - combo.training.trainer - Estimated training time remaining: 6:34:38\n",
+      "2023-04-06 23:47:16,342 - INFO - allennlp.training.trainer - Epoch 51/399\n",
+      "2023-04-06 23:47:16,342 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:47:16,342 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:47:16,348 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9418, LAS: 0.8849, UEM: 0.3598, LEM: 0.1190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6567, partial_loss/deprel_loss: 0.7006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8380, loss: 0.7955, batch_reg_loss: 0.1462, reg_loss: 0.1462 ||:   3%|3         | 3/95 [00:02<01:02,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9489, LAS: 0.8934, UEM: 0.5391, LEM: 0.2555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3646, partial_loss/deprel_loss: 0.5189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6343, loss: 0.7233, batch_reg_loss: 0.1463, reg_loss: 0.1462 ||:   6%|6         | 6/95 [00:04<01:03,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9484, LAS: 0.8927, UEM: 0.5886, LEM: 0.3045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2742, partial_loss/deprel_loss: 0.4436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.7152, batch_reg_loss: 0.1463, reg_loss: 0.1462 ||:   9%|9         | 9/95 [00:06<01:04,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9482, LAS: 0.8929, UEM: 0.5899, LEM: 0.3152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5917, partial_loss/deprel_loss: 0.6768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8061, loss: 0.7116, batch_reg_loss: 0.1464, reg_loss: 0.1463 ||:  14%|#3        | 13/95 [00:09<00:58,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9425, LAS: 0.8861, UEM: 0.5435, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4471, partial_loss/deprel_loss: 0.5360, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6646, loss: 0.7664, batch_reg_loss: 0.1464, reg_loss: 0.1463 ||:  18%|#7        | 17/95 [00:11<00:52,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9440, LAS: 0.8886, UEM: 0.5466, LEM: 0.2774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4041, partial_loss/deprel_loss: 0.4940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6226, loss: 0.7496, batch_reg_loss: 0.1465, reg_loss: 0.1463 ||:  22%|##2       | 21/95 [00:14<00:48,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9404, LAS: 0.8849, UEM: 0.5174, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0270, partial_loss/deprel_loss: 0.9598, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1198, loss: 0.7867, batch_reg_loss: 0.1465, reg_loss: 0.1464 ||:  25%|##5       | 24/95 [00:16<00:47,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9391, LAS: 0.8837, UEM: 0.5188, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2842, partial_loss/deprel_loss: 0.4099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5314, loss: 0.7961, batch_reg_loss: 0.1466, reg_loss: 0.1464 ||:  28%|##8       | 27/95 [00:18<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9409, LAS: 0.8856, UEM: 0.5292, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2306, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5539, loss: 0.7793, batch_reg_loss: 0.1467, reg_loss: 0.1464 ||:  33%|###2      | 31/95 [00:20<00:42,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9418, LAS: 0.8865, UEM: 0.5381, LEM: 0.2730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2403, partial_loss/deprel_loss: 0.4465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5520, loss: 0.7741, batch_reg_loss: 0.1467, reg_loss: 0.1464 ||:  36%|###5      | 34/95 [00:23<00:41,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9413, LAS: 0.8859, UEM: 0.5288, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4709, partial_loss/deprel_loss: 0.5891, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7123, loss: 0.7800, batch_reg_loss: 0.1468, reg_loss: 0.1465 ||:  39%|###8      | 37/95 [00:25<00:39,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9425, LAS: 0.8874, UEM: 0.5445, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1804, partial_loss/deprel_loss: 0.3495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4625, loss: 0.7694, batch_reg_loss: 0.1469, reg_loss: 0.1465 ||:  43%|####3     | 41/95 [00:27<00:36,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8694, UAS: 0.9425, LAS: 0.8873, UEM: 0.5542, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7870, partial_loss/deprel_loss: 0.7960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9411, loss: 0.7686, batch_reg_loss: 0.1469, reg_loss: 0.1465 ||:  46%|####6     | 44/95 [00:30<00:35,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9432, LAS: 0.8885, UEM: 0.5694, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1664, partial_loss/deprel_loss: 0.3307, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4448, loss: 0.7603, batch_reg_loss: 0.1470, reg_loss: 0.1466 ||:  49%|####9     | 47/95 [00:32<00:34,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9404, LAS: 0.8856, UEM: 0.5516, LEM: 0.2966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1840, partial_loss/deprel_loss: 0.8997, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1035, loss: 0.7850, batch_reg_loss: 0.1470, reg_loss: 0.1466 ||:  54%|#####3    | 51/95 [00:34<00:30,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8368, UAS: 0.9406, LAS: 0.8859, UEM: 0.5674, LEM: 0.3173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9788, partial_loss/deprel_loss: 0.9509, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1035, loss: 0.7812, batch_reg_loss: 0.1471, reg_loss: 0.1466 ||:  57%|#####6    | 54/95 [00:36<00:28,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9391, LAS: 0.8844, UEM: 0.5723, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2408, partial_loss/deprel_loss: 0.4449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5512, loss: 0.7934, batch_reg_loss: 0.1471, reg_loss: 0.1467 ||:  61%|######1   | 58/95 [00:39<00:24,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7838, UAS: 0.9380, LAS: 0.8832, UEM: 0.5718, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1437, partial_loss/deprel_loss: 1.2796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5997, loss: 0.8041, batch_reg_loss: 0.1472, reg_loss: 0.1467 ||:  65%|######5   | 62/95 [00:42<00:22,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8767, UAS: 0.9389, LAS: 0.8846, UEM: 0.5914, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7249, partial_loss/deprel_loss: 0.7364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8814, loss: 0.7952, batch_reg_loss: 0.1473, reg_loss: 0.1467 ||:  68%|######8   | 65/95 [00:44<00:20,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9377, LAS: 0.8832, UEM: 0.5912, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1658, partial_loss/deprel_loss: 0.3402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4526, loss: 0.8055, batch_reg_loss: 0.1473, reg_loss: 0.1467 ||:  73%|#######2  | 69/95 [00:47<00:17,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9380, LAS: 0.8834, UEM: 0.5869, LEM: 0.3451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5853, partial_loss/deprel_loss: 0.6372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7742, loss: 0.8042, batch_reg_loss: 0.1474, reg_loss: 0.1468 ||:  76%|#######5  | 72/95 [00:49<00:15,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8181, UAS: 0.9366, LAS: 0.8817, UEM: 0.5751, LEM: 0.3361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4094, partial_loss/deprel_loss: 0.9917, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2227, loss: 0.8158, batch_reg_loss: 0.1475, reg_loss: 0.1468 ||:  80%|########  | 76/95 [00:51<00:12,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8381, UAS: 0.9358, LAS: 0.8808, UEM: 0.5683, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1287, partial_loss/deprel_loss: 0.9087, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1003, loss: 0.8236, batch_reg_loss: 0.1476, reg_loss: 0.1468 ||:  84%|########4 | 80/95 [00:53<00:09,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9358, LAS: 0.8808, UEM: 0.5622, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3467, partial_loss/deprel_loss: 0.5521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6587, loss: 0.8243, batch_reg_loss: 0.1476, reg_loss: 0.1469 ||:  88%|########8 | 84/95 [00:56<00:07,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9364, LAS: 0.8813, UEM: 0.5618, LEM: 0.3204, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5633, partial_loss/deprel_loss: 0.7083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8270, loss: 0.8204, batch_reg_loss: 0.1477, reg_loss: 0.1469 ||:  93%|#########2| 88/95 [00:59<00:04,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9373, LAS: 0.8825, UEM: 0.5713, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3449, partial_loss/deprel_loss: 0.5724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6747, loss: 0.8121, batch_reg_loss: 0.1478, reg_loss: 0.1469 ||:  96%|#########5| 91/95 [01:02<00:02,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9378, LAS: 0.8829, UEM: 0.5731, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2890, partial_loss/deprel_loss: 0.4753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.8094, batch_reg_loss: 0.1479, reg_loss: 0.1470 ||: 100%|##########| 95/95 [01:04<00:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9378, LAS: 0.8829, UEM: 0.5731, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2890, partial_loss/deprel_loss: 0.4753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.8094, batch_reg_loss: 0.1479, reg_loss: 0.1470 ||: 100%|##########| 95/95 [01:04<00:00,  1.47it/s]\n",
+      "2023-04-06 23:48:21,159 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:48:21,159 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:48:21,159 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.147  |       N/A\n",
+      "2023-04-06 23:48:21,159 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - UEM                      |     0.573  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - LEM                      |     0.328  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - EM                       |     0.912  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.289  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - UAS                      |     0.938  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.475  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - loss                     |     0.809  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - LAS                      |     0.883  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:48:21,160 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:48:21,161 - INFO - combo.training.trainer - Epoch duration: 0:01:04.818947\n",
+      "2023-04-06 23:48:21,161 - INFO - combo.training.trainer - Estimated training time remaining: 6:33:10\n",
+      "2023-04-06 23:48:21,161 - INFO - allennlp.training.trainer - Epoch 52/399\n",
+      "2023-04-06 23:48:21,161 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:48:21,162 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:48:21,167 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9308, LAS: 0.8799, UEM: 0.6359, LEM: 0.4512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1617, partial_loss/deprel_loss: 0.3055, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4247, loss: 0.8042, batch_reg_loss: 0.1479, reg_loss: 0.1479 ||:   3%|3         | 3/95 [00:02<01:06,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9420, LAS: 0.8884, UEM: 0.6471, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1579, partial_loss/deprel_loss: 0.4190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5147, loss: 0.7566, batch_reg_loss: 0.1480, reg_loss: 0.1479 ||:   7%|7         | 7/95 [00:04<01:01,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8480, UAS: 0.9364, LAS: 0.8820, UEM: 0.5961, LEM: 0.3525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1484, partial_loss/deprel_loss: 1.0143, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1891, loss: 0.8171, batch_reg_loss: 0.1480, reg_loss: 0.1480 ||:  11%|#         | 10/95 [00:06<01:00,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9336, LAS: 0.8782, UEM: 0.5276, LEM: 0.2999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7180, partial_loss/deprel_loss: 0.7570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8973, loss: 0.8447, batch_reg_loss: 0.1481, reg_loss: 0.1480 ||:  15%|#4        | 14/95 [00:09<00:53,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8710, UAS: 0.9357, LAS: 0.8806, UEM: 0.5214, LEM: 0.2849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6777, partial_loss/deprel_loss: 0.8299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9476, loss: 0.8326, batch_reg_loss: 0.1481, reg_loss: 0.1480 ||:  18%|#7        | 17/95 [00:11<00:52,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9371, LAS: 0.8815, UEM: 0.5317, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3349, partial_loss/deprel_loss: 0.5308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6398, loss: 0.8226, batch_reg_loss: 0.1482, reg_loss: 0.1480 ||:  22%|##2       | 21/95 [00:13<00:49,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8498, UAS: 0.9336, LAS: 0.8785, UEM: 0.5080, LEM: 0.2708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0253, partial_loss/deprel_loss: 0.9645, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1249, loss: 0.8501, batch_reg_loss: 0.1483, reg_loss: 0.1481 ||:  26%|##6       | 25/95 [00:16<00:46,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9349, LAS: 0.8800, UEM: 0.5150, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2474, partial_loss/deprel_loss: 0.4210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5346, loss: 0.8417, batch_reg_loss: 0.1483, reg_loss: 0.1481 ||:  29%|##9       | 28/95 [00:18<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9358, LAS: 0.8812, UEM: 0.5436, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.4435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5508, loss: 0.8294, batch_reg_loss: 0.1484, reg_loss: 0.1481 ||:  33%|###2      | 31/95 [00:21<00:47,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9358, LAS: 0.8813, UEM: 0.5378, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4386, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7045, loss: 0.8295, batch_reg_loss: 0.1485, reg_loss: 0.1482 ||:  37%|###6      | 35/95 [00:24<00:43,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9380, LAS: 0.8842, UEM: 0.5699, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1450, partial_loss/deprel_loss: 0.2676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3916, loss: 0.8068, batch_reg_loss: 0.1485, reg_loss: 0.1482 ||:  41%|####1     | 39/95 [00:26<00:39,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7942, UAS: 0.9366, LAS: 0.8825, UEM: 0.5679, LEM: 0.3191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9756, partial_loss/deprel_loss: 1.2451, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5398, loss: 0.8189, batch_reg_loss: 0.1486, reg_loss: 0.1482 ||:  44%|####4     | 42/95 [00:29<00:38,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9361, LAS: 0.8820, UEM: 0.5585, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2940, partial_loss/deprel_loss: 0.4615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5767, loss: 0.8254, batch_reg_loss: 0.1487, reg_loss: 0.1483 ||:  48%|####8     | 46/95 [00:31<00:33,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9373, LAS: 0.8833, UEM: 0.5702, LEM: 0.3198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4421, partial_loss/deprel_loss: 0.6539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7603, loss: 0.8182, batch_reg_loss: 0.1487, reg_loss: 0.1483 ||:  52%|#####1    | 49/95 [00:33<00:31,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9373, LAS: 0.8831, UEM: 0.5623, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4181, partial_loss/deprel_loss: 0.6043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7158, loss: 0.8206, batch_reg_loss: 0.1488, reg_loss: 0.1483 ||:  55%|#####4    | 52/95 [00:35<00:30,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9375, LAS: 0.8832, UEM: 0.5650, LEM: 0.3138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2680, partial_loss/deprel_loss: 0.4244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5420, loss: 0.8150, batch_reg_loss: 0.1488, reg_loss: 0.1483 ||:  59%|#####8    | 56/95 [00:38<00:26,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8324, UAS: 0.9381, LAS: 0.8839, UEM: 0.5715, LEM: 0.3173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3018, partial_loss/deprel_loss: 1.0026, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2113, loss: 0.8112, batch_reg_loss: 0.1489, reg_loss: 0.1484 ||:  63%|######3   | 60/95 [00:40<00:23,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9374, LAS: 0.8830, UEM: 0.5618, LEM: 0.3098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7262, partial_loss/deprel_loss: 0.7235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8730, loss: 0.8165, batch_reg_loss: 0.1489, reg_loss: 0.1484 ||:  66%|######6   | 63/95 [00:42<00:21,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9382, LAS: 0.8840, UEM: 0.5622, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4737, partial_loss/deprel_loss: 0.6175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7378, loss: 0.8098, batch_reg_loss: 0.1490, reg_loss: 0.1484 ||:  69%|######9   | 66/95 [00:44<00:19,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8108, UAS: 0.9377, LAS: 0.8833, UEM: 0.5594, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4983, partial_loss/deprel_loss: 1.1986, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4076, loss: 0.8166, batch_reg_loss: 0.1490, reg_loss: 0.1485 ||:  73%|#######2  | 69/95 [00:47<00:18,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9378, LAS: 0.8833, UEM: 0.5587, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3065, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6111, loss: 0.8146, batch_reg_loss: 0.1491, reg_loss: 0.1485 ||:  76%|#######5  | 72/95 [00:49<00:16,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9391, LAS: 0.8849, UEM: 0.5869, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2669, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5672, loss: 0.8003, batch_reg_loss: 0.1491, reg_loss: 0.1485 ||:  79%|#######8  | 75/95 [00:52<00:15,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9391, LAS: 0.8849, UEM: 0.5810, LEM: 0.3327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6178, partial_loss/deprel_loss: 0.7175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8468, loss: 0.7992, batch_reg_loss: 0.1492, reg_loss: 0.1485 ||:  83%|########3 | 79/95 [00:54<00:11,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8830, UAS: 0.9390, LAS: 0.8849, UEM: 0.5754, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6301, partial_loss/deprel_loss: 0.7038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8383, loss: 0.7999, batch_reg_loss: 0.1492, reg_loss: 0.1486 ||:  86%|########6 | 82/95 [00:56<00:09,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8864, UAS: 0.9389, LAS: 0.8847, UEM: 0.5671, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5044, partial_loss/deprel_loss: 0.7119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8197, loss: 0.8009, batch_reg_loss: 0.1493, reg_loss: 0.1486 ||:  91%|######### | 86/95 [00:59<00:06,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9396, LAS: 0.8856, UEM: 0.5762, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1137, partial_loss/deprel_loss: 0.3177, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4263, loss: 0.7948, batch_reg_loss: 0.1494, reg_loss: 0.1486 ||:  95%|#########4| 90/95 [01:02<00:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9392, LAS: 0.8851, UEM: 0.5773, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3726, partial_loss/deprel_loss: 0.5450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.7989, batch_reg_loss: 0.1494, reg_loss: 0.1487 ||:  98%|#########7| 93/95 [01:04<00:01,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8315, UAS: 0.9387, LAS: 0.8846, UEM: 0.5744, LEM: 0.3280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2811, partial_loss/deprel_loss: 0.9185, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1404, loss: 0.8018, batch_reg_loss: 0.1495, reg_loss: 0.1487 ||: 100%|##########| 95/95 [01:05<00:00,  1.44it/s]\n",
+      "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.149  |       N/A\n",
+      "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - UEM                      |     0.574  |       N/A\n",
+      "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - LEM                      |     0.328  |       N/A\n",
+      "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - EM                       |     0.832  |       N/A\n",
+      "2023-04-06 23:49:26,971 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.281  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - UAS                      |     0.939  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.918  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - loss                     |     0.802  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - LAS                      |     0.885  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:49:26,972 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:49:26,973 - INFO - combo.training.trainer - Epoch duration: 0:01:05.811734\n",
+      "2023-04-06 23:49:26,973 - INFO - combo.training.trainer - Estimated training time remaining: 6:31:49\n",
+      "2023-04-06 23:49:26,973 - INFO - allennlp.training.trainer - Epoch 53/399\n",
+      "2023-04-06 23:49:26,973 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:49:26,974 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:49:26,980 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8393, UAS: 0.9074, LAS: 0.8516, UEM: 0.2768, LEM: 0.1176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2356, partial_loss/deprel_loss: 0.9544, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1601, loss: 1.0297, batch_reg_loss: 0.1495, reg_loss: 0.1495 ||:   3%|3         | 3/95 [00:02<01:06,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9332, LAS: 0.8793, UEM: 0.6292, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3958, partial_loss/deprel_loss: 0.5297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6525, loss: 0.8124, batch_reg_loss: 0.1496, reg_loss: 0.1495 ||:   6%|6         | 6/95 [00:04<01:03,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9334, LAS: 0.8799, UEM: 0.5389, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4452, partial_loss/deprel_loss: 0.5596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6863, loss: 0.8171, batch_reg_loss: 0.1496, reg_loss: 0.1495 ||:  11%|#         | 10/95 [00:06<00:56,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9385, LAS: 0.8856, UEM: 0.5737, LEM: 0.3425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1791, partial_loss/deprel_loss: 0.3581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4720, loss: 0.7805, batch_reg_loss: 0.1497, reg_loss: 0.1496 ||:  14%|#3        | 13/95 [00:08<00:56,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8637, UAS: 0.9397, LAS: 0.8870, UEM: 0.5782, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9353, partial_loss/deprel_loss: 0.8215, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9940, loss: 0.7734, batch_reg_loss: 0.1497, reg_loss: 0.1496 ||:  17%|#6        | 16/95 [00:10<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8284, UAS: 0.9376, LAS: 0.8846, UEM: 0.5705, LEM: 0.3324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3460, partial_loss/deprel_loss: 1.0317, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2443, loss: 0.7951, batch_reg_loss: 0.1498, reg_loss: 0.1496 ||:  21%|##1       | 20/95 [00:13<00:50,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9387, LAS: 0.8857, UEM: 0.5541, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5471, partial_loss/deprel_loss: 0.7203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8355, loss: 0.7887, batch_reg_loss: 0.1499, reg_loss: 0.1497 ||:  24%|##4       | 23/95 [00:15<00:48,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9406, LAS: 0.8880, UEM: 0.5694, LEM: 0.3269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6971, partial_loss/deprel_loss: 0.7017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8507, loss: 0.7714, batch_reg_loss: 0.1499, reg_loss: 0.1497 ||:  27%|##7       | 26/95 [00:17<00:48,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8546, UAS: 0.9401, LAS: 0.8875, UEM: 0.5800, LEM: 0.3425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8850, partial_loss/deprel_loss: 0.8165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9802, loss: 0.7746, batch_reg_loss: 0.1500, reg_loss: 0.1497 ||:  31%|###       | 29/95 [00:19<00:46,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9407, LAS: 0.8880, UEM: 0.5727, LEM: 0.3301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4124, partial_loss/deprel_loss: 0.5812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6975, loss: 0.7700, batch_reg_loss: 0.1500, reg_loss: 0.1497 ||:  34%|###3      | 32/95 [00:21<00:44,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9424, LAS: 0.8896, UEM: 0.5849, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3894, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7179, loss: 0.7588, batch_reg_loss: 0.1501, reg_loss: 0.1498 ||:  37%|###6      | 35/95 [00:24<00:45,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9401, LAS: 0.8871, UEM: 0.5659, LEM: 0.3205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6715, partial_loss/deprel_loss: 0.7216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8617, loss: 0.7798, batch_reg_loss: 0.1501, reg_loss: 0.1498 ||:  40%|####      | 38/95 [00:26<00:42,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9402, LAS: 0.8874, UEM: 0.5589, LEM: 0.3125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2362, partial_loss/deprel_loss: 0.4092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5247, loss: 0.7810, batch_reg_loss: 0.1502, reg_loss: 0.1498 ||:  44%|####4     | 42/95 [00:29<00:37,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8499, UAS: 0.9405, LAS: 0.8873, UEM: 0.5617, LEM: 0.3126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9249, partial_loss/deprel_loss: 0.8992, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0545, loss: 0.7805, batch_reg_loss: 0.1502, reg_loss: 0.1498 ||:  47%|####7     | 45/95 [00:31<00:35,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9401, LAS: 0.8867, UEM: 0.5562, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2549, partial_loss/deprel_loss: 0.3797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5050, loss: 0.7841, batch_reg_loss: 0.1503, reg_loss: 0.1499 ||:  52%|#####1    | 49/95 [00:34<00:32,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9389, LAS: 0.8857, UEM: 0.5537, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2715, partial_loss/deprel_loss: 0.4252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5448, loss: 0.7928, batch_reg_loss: 0.1503, reg_loss: 0.1499 ||:  55%|#####4    | 52/95 [00:36<00:30,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8194, UAS: 0.9378, LAS: 0.8848, UEM: 0.5472, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7601, partial_loss/deprel_loss: 1.0152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3145, loss: 0.8008, batch_reg_loss: 0.1504, reg_loss: 0.1499 ||:  58%|#####7    | 55/95 [00:38<00:28,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9370, LAS: 0.8838, UEM: 0.5553, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2572, partial_loss/deprel_loss: 0.4285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5446, loss: 0.8078, batch_reg_loss: 0.1504, reg_loss: 0.1500 ||:  61%|######1   | 58/95 [00:40<00:26,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9364, LAS: 0.8831, UEM: 0.5463, LEM: 0.3027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4287, partial_loss/deprel_loss: 0.5523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6781, loss: 0.8138, batch_reg_loss: 0.1505, reg_loss: 0.1500 ||:  65%|######5   | 62/95 [00:42<00:22,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9364, LAS: 0.8830, UEM: 0.5485, LEM: 0.3053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2064, partial_loss/deprel_loss: 0.3761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4928, loss: 0.8177, batch_reg_loss: 0.1506, reg_loss: 0.1500 ||:  69%|######9   | 66/95 [00:45<00:19,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9381, LAS: 0.8851, UEM: 0.5775, LEM: 0.3391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3076, partial_loss/deprel_loss: 0.4389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5633, loss: 0.8029, batch_reg_loss: 0.1507, reg_loss: 0.1501 ||:  74%|#######3  | 70/95 [00:48<00:16,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9380, LAS: 0.8847, UEM: 0.5696, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5853, partial_loss/deprel_loss: 0.7426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8619, loss: 0.8040, batch_reg_loss: 0.1507, reg_loss: 0.1501 ||:  78%|#######7  | 74/95 [00:50<00:13,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9385, LAS: 0.8852, UEM: 0.5755, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7588, partial_loss/deprel_loss: 0.7845, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9302, loss: 0.7990, batch_reg_loss: 0.1508, reg_loss: 0.1501 ||:  82%|########2 | 78/95 [00:53<00:11,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9397, LAS: 0.8864, UEM: 0.5853, LEM: 0.3418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2012, partial_loss/deprel_loss: 0.4047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5149, loss: 0.7898, batch_reg_loss: 0.1509, reg_loss: 0.1502 ||:  86%|########6 | 82/95 [00:55<00:08,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8571, UAS: 0.9392, LAS: 0.8857, UEM: 0.5788, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7710, partial_loss/deprel_loss: 0.8137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9561, loss: 0.7949, batch_reg_loss: 0.1509, reg_loss: 0.1502 ||:  91%|######### | 86/95 [00:58<00:05,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9395, LAS: 0.8860, UEM: 0.5767, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3494, partial_loss/deprel_loss: 0.5346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6486, loss: 0.7926, batch_reg_loss: 0.1510, reg_loss: 0.1502 ||:  95%|#########4| 90/95 [01:00<00:03,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8603, UAS: 0.9386, LAS: 0.8847, UEM: 0.5728, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8984, partial_loss/deprel_loss: 0.8506, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0112, loss: 0.8005, batch_reg_loss: 0.1511, reg_loss: 0.1503 ||:  99%|#########8| 94/95 [01:03<00:00,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9382, LAS: 0.8843, UEM: 0.5700, LEM: 0.3266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0352, partial_loss/deprel_loss: 0.9346, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1058, loss: 0.8037, batch_reg_loss: 0.1511, reg_loss: 0.1503 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-06 23:50:30,698 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.150  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - UEM                      |     0.570  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - LEM                      |     0.327  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - EM                       |     0.841  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.035  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - UAS                      |     0.938  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.935  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - loss                     |     0.804  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - LAS                      |     0.884  |       N/A\n",
+      "2023-04-06 23:50:30,699 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:50:30,700 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:50:30,700 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:50:30,700 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:50:30,700 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:50:30,700 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:50:30,700 - INFO - combo.training.trainer - Epoch duration: 0:01:03.727272\n",
+      "2023-04-06 23:50:30,701 - INFO - combo.training.trainer - Estimated training time remaining: 6:30:15\n",
+      "2023-04-06 23:50:30,701 - INFO - allennlp.training.trainer - Epoch 54/399\n",
+      "2023-04-06 23:50:30,701 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:50:30,701 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:50:30,708 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9432, LAS: 0.8912, UEM: 0.4653, LEM: 0.1987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3018, partial_loss/deprel_loss: 0.5142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6229, loss: 0.7230, batch_reg_loss: 0.1512, reg_loss: 0.1511 ||:   4%|4         | 4/95 [00:02<00:53,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9407, LAS: 0.8860, UEM: 0.4340, LEM: 0.1799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5516, partial_loss/deprel_loss: 0.6807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8061, loss: 0.7673, batch_reg_loss: 0.1512, reg_loss: 0.1512 ||:   7%|7         | 7/95 [00:04<00:55,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9446, LAS: 0.8911, UEM: 0.5261, LEM: 0.2600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6742, partial_loss/deprel_loss: 0.7591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8934, loss: 0.7372, batch_reg_loss: 0.1513, reg_loss: 0.1512 ||:  11%|#         | 10/95 [00:06<00:56,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8014, UAS: 0.9321, LAS: 0.8777, UEM: 0.4638, LEM: 0.2215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7332, partial_loss/deprel_loss: 1.1551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4221, loss: 0.8509, batch_reg_loss: 0.1513, reg_loss: 0.1512 ||:  15%|#4        | 14/95 [00:09<00:54,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9389, LAS: 0.8856, UEM: 0.5889, LEM: 0.3443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1185, partial_loss/deprel_loss: 0.2801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3991, loss: 0.7908, batch_reg_loss: 0.1514, reg_loss: 0.1512 ||:  18%|#7        | 17/95 [00:11<00:54,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9422, LAS: 0.8906, UEM: 0.6494, LEM: 0.4311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8040, partial_loss/deprel_loss: 0.8287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9752, loss: 0.7633, batch_reg_loss: 0.1514, reg_loss: 0.1513 ||:  21%|##1       | 20/95 [00:14<00:54,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.9409, LAS: 0.8893, UEM: 0.6266, LEM: 0.4081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0245, partial_loss/deprel_loss: 0.9164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0895, loss: 0.7669, batch_reg_loss: 0.1515, reg_loss: 0.1513 ||:  25%|##5       | 24/95 [00:16<00:49,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9400, LAS: 0.8877, UEM: 0.6214, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2229, partial_loss/deprel_loss: 0.4560, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5609, loss: 0.7795, batch_reg_loss: 0.1516, reg_loss: 0.1513 ||:  28%|##8       | 27/95 [00:18<00:47,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9423, LAS: 0.8900, UEM: 0.6320, LEM: 0.3967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3760, partial_loss/deprel_loss: 0.5327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6529, loss: 0.7602, batch_reg_loss: 0.1516, reg_loss: 0.1514 ||:  32%|###1      | 30/95 [00:20<00:45,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9402, LAS: 0.8870, UEM: 0.6083, LEM: 0.3746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5305, partial_loss/deprel_loss: 0.6831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8043, loss: 0.7803, batch_reg_loss: 0.1517, reg_loss: 0.1514 ||:  36%|###5      | 34/95 [00:23<00:40,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9400, LAS: 0.8864, UEM: 0.5986, LEM: 0.3629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3237, partial_loss/deprel_loss: 0.5330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6429, loss: 0.7899, batch_reg_loss: 0.1517, reg_loss: 0.1514 ||:  40%|####      | 38/95 [00:25<00:36,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9409, LAS: 0.8871, UEM: 0.6169, LEM: 0.3787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0997, partial_loss/deprel_loss: 0.3137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4227, loss: 0.7853, batch_reg_loss: 0.1518, reg_loss: 0.1515 ||:  44%|####4     | 42/95 [00:29<00:37,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9413, LAS: 0.8877, UEM: 0.6130, LEM: 0.3720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9848, partial_loss/deprel_loss: 0.9332, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0954, loss: 0.7816, batch_reg_loss: 0.1519, reg_loss: 0.1515 ||:  48%|####8     | 46/95 [00:31<00:33,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9406, LAS: 0.8871, UEM: 0.6170, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2747, partial_loss/deprel_loss: 0.4643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5783, loss: 0.7857, batch_reg_loss: 0.1520, reg_loss: 0.1515 ||:  53%|#####2    | 50/95 [00:34<00:30,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9409, LAS: 0.8871, UEM: 0.6076, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5270, partial_loss/deprel_loss: 0.6130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7478, loss: 0.7860, batch_reg_loss: 0.1520, reg_loss: 0.1516 ||:  56%|#####5    | 53/95 [00:36<00:28,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9395, LAS: 0.8854, UEM: 0.6006, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4682, partial_loss/deprel_loss: 0.6048, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7295, loss: 0.7997, batch_reg_loss: 0.1521, reg_loss: 0.1516 ||:  60%|######    | 57/95 [00:38<00:25,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9390, LAS: 0.8849, UEM: 0.5891, LEM: 0.3447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6837, partial_loss/deprel_loss: 0.6771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8306, loss: 0.8014, batch_reg_loss: 0.1521, reg_loss: 0.1516 ||:  64%|######4   | 61/95 [00:41<00:22,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9387, LAS: 0.8846, UEM: 0.5810, LEM: 0.3362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0663, partial_loss/deprel_loss: 0.8890, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0767, loss: 0.8040, batch_reg_loss: 0.1522, reg_loss: 0.1517 ||:  68%|######8   | 65/95 [00:43<00:18,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9382, LAS: 0.8842, UEM: 0.5700, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7110, partial_loss/deprel_loss: 0.7114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8636, loss: 0.8082, batch_reg_loss: 0.1523, reg_loss: 0.1517 ||:  73%|#######2  | 69/95 [00:46<00:16,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9388, LAS: 0.8849, UEM: 0.5726, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2094, partial_loss/deprel_loss: 0.4050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5182, loss: 0.8035, batch_reg_loss: 0.1523, reg_loss: 0.1517 ||:  77%|#######6  | 73/95 [00:48<00:13,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9375, LAS: 0.8835, UEM: 0.5630, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4102, partial_loss/deprel_loss: 0.9987, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2334, loss: 0.8147, batch_reg_loss: 0.1524, reg_loss: 0.1518 ||:  81%|########1 | 77/95 [00:50<00:10,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9172, UAS: 0.9382, LAS: 0.8841, UEM: 0.5651, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2742, partial_loss/deprel_loss: 0.4569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5728, loss: 0.8095, batch_reg_loss: 0.1525, reg_loss: 0.1518 ||:  85%|########5 | 81/95 [00:53<00:08,  1.60it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9380, LAS: 0.8841, UEM: 0.5726, LEM: 0.3309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6431, partial_loss/deprel_loss: 0.7291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8645, loss: 0.8083, batch_reg_loss: 0.1526, reg_loss: 0.1518 ||:  89%|########9 | 85/95 [00:56<00:06,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8391, UAS: 0.9384, LAS: 0.8845, UEM: 0.5755, LEM: 0.3316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1240, partial_loss/deprel_loss: 0.8925, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0915, loss: 0.8048, batch_reg_loss: 0.1526, reg_loss: 0.1519 ||:  94%|#########3| 89/95 [00:59<00:04,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9386, LAS: 0.8847, UEM: 0.5751, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5276, partial_loss/deprel_loss: 0.6364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7674, loss: 0.8045, batch_reg_loss: 0.1527, reg_loss: 0.1519 ||:  98%|#########7| 93/95 [01:02<00:01,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9384, LAS: 0.8844, UEM: 0.5714, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5570, partial_loss/deprel_loss: 0.7028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8264, loss: 0.8055, batch_reg_loss: 0.1527, reg_loss: 0.1519 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-06 23:51:34,583 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:51:34,583 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:51:34,583 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.152  |       N/A\n",
+      "2023-04-06 23:51:34,583 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,583 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - UEM                      |     0.571  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - LEM                      |     0.328  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - EM                       |     0.880  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.557  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - UAS                      |     0.938  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.703  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - loss                     |     0.806  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - LAS                      |     0.884  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,584 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,585 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,585 - INFO - combo.training.trainer - Epoch duration: 0:01:03.884523\n",
+      "2023-04-06 23:51:34,585 - INFO - combo.training.trainer - Estimated training time remaining: 6:28:44\n",
+      "2023-04-06 23:51:34,585 - INFO - allennlp.training.trainer - Epoch 55/399\n",
+      "2023-04-06 23:51:34,586 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:51:34,586 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:51:34,592 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9246, LAS: 0.8702, UEM: 0.4162, LEM: 0.1844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7076, partial_loss/deprel_loss: 0.7673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9081, loss: 0.9192, batch_reg_loss: 0.1528, reg_loss: 0.1528 ||:   3%|3         | 3/95 [00:02<01:09,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9409, LAS: 0.8876, UEM: 0.6300, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3062, partial_loss/deprel_loss: 0.4841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6013, loss: 0.7514, batch_reg_loss: 0.1528, reg_loss: 0.1528 ||:   6%|6         | 6/95 [00:04<01:11,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9288, LAS: 0.8742, UEM: 0.5475, LEM: 0.3031, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2014, partial_loss/deprel_loss: 0.9325, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1391, loss: 0.8618, batch_reg_loss: 0.1529, reg_loss: 0.1528 ||:   9%|9         | 9/95 [00:07<01:06,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9283, LAS: 0.8745, UEM: 0.5024, LEM: 0.2643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4370, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6525, loss: 0.8605, batch_reg_loss: 0.1530, reg_loss: 0.1529 ||:  14%|#3        | 13/95 [00:09<01:00,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9333, LAS: 0.8803, UEM: 0.5678, LEM: 0.3236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2531, partial_loss/deprel_loss: 0.4340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5508, loss: 0.8142, batch_reg_loss: 0.1530, reg_loss: 0.1529 ||:  17%|#6        | 16/95 [00:12<01:00,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9314, LAS: 0.8772, UEM: 0.5379, LEM: 0.2921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5511, partial_loss/deprel_loss: 0.6187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7583, loss: 0.8362, batch_reg_loss: 0.1531, reg_loss: 0.1529 ||:  21%|##1       | 20/95 [00:14<00:54,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9573, UAS: 0.9366, LAS: 0.8835, UEM: 0.6102, LEM: 0.3794, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0675, partial_loss/deprel_loss: 0.1877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3168, loss: 0.7936, batch_reg_loss: 0.1531, reg_loss: 0.1529 ||:  25%|##5       | 24/95 [00:17<00:52,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9288, UAS: 0.9365, LAS: 0.8834, UEM: 0.5995, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2511, partial_loss/deprel_loss: 0.4303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5477, loss: 0.8045, batch_reg_loss: 0.1532, reg_loss: 0.1530 ||:  29%|##9       | 28/95 [00:20<00:47,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9370, LAS: 0.8837, UEM: 0.5871, LEM: 0.3543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6924, partial_loss/deprel_loss: 0.7964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9289, loss: 0.8024, batch_reg_loss: 0.1533, reg_loss: 0.1530 ||:  33%|###2      | 31/95 [00:22<00:46,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9347, LAS: 0.8810, UEM: 0.5645, LEM: 0.3344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.6442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7922, loss: 0.8214, batch_reg_loss: 0.1533, reg_loss: 0.1530 ||:  37%|###6      | 35/95 [00:25<00:41,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9353, LAS: 0.8816, UEM: 0.5658, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2670, partial_loss/deprel_loss: 0.4818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5922, loss: 0.8181, batch_reg_loss: 0.1534, reg_loss: 0.1531 ||:  40%|####      | 38/95 [00:27<00:39,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8591, UAS: 0.9350, LAS: 0.8809, UEM: 0.5577, LEM: 0.3223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9163, partial_loss/deprel_loss: 0.8228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9950, loss: 0.8232, batch_reg_loss: 0.1535, reg_loss: 0.1531 ||:  44%|####4     | 42/95 [00:29<00:35,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9343, LAS: 0.8800, UEM: 0.5480, LEM: 0.3151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3827, partial_loss/deprel_loss: 0.5582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6766, loss: 0.8292, batch_reg_loss: 0.1535, reg_loss: 0.1531 ||:  47%|####7     | 45/95 [00:31<00:34,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9360, LAS: 0.8817, UEM: 0.5640, LEM: 0.3267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4991, partial_loss/deprel_loss: 0.6491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7727, loss: 0.8155, batch_reg_loss: 0.1536, reg_loss: 0.1532 ||:  51%|#####     | 48/95 [00:33<00:31,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9372, LAS: 0.8833, UEM: 0.5737, LEM: 0.3329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2591, partial_loss/deprel_loss: 0.4242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5448, loss: 0.8033, batch_reg_loss: 0.1536, reg_loss: 0.1532 ||:  54%|#####3    | 51/95 [00:35<00:30,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8744, UAS: 0.9379, LAS: 0.8836, UEM: 0.5688, LEM: 0.3256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6107, partial_loss/deprel_loss: 0.7630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8862, loss: 0.8026, batch_reg_loss: 0.1537, reg_loss: 0.1532 ||:  58%|#####7    | 55/95 [00:38<00:26,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9386, LAS: 0.8845, UEM: 0.5654, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3918, partial_loss/deprel_loss: 0.5176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6462, loss: 0.7971, batch_reg_loss: 0.1538, reg_loss: 0.1533 ||:  62%|######2   | 59/95 [00:40<00:23,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9392, LAS: 0.8850, UEM: 0.5727, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4212, partial_loss/deprel_loss: 0.5769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6996, loss: 0.7926, batch_reg_loss: 0.1538, reg_loss: 0.1533 ||:  66%|######6   | 63/95 [00:43<00:20,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9371, LAS: 0.8827, UEM: 0.5671, LEM: 0.3200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8757, partial_loss/deprel_loss: 0.8471, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0066, loss: 0.8118, batch_reg_loss: 0.1539, reg_loss: 0.1533 ||:  71%|#######   | 67/95 [00:46<00:18,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9374, LAS: 0.8829, UEM: 0.5622, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5699, partial_loss/deprel_loss: 0.7673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8817, loss: 0.8103, batch_reg_loss: 0.1539, reg_loss: 0.1534 ||:  75%|#######4  | 71/95 [00:48<00:15,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8005, UAS: 0.9372, LAS: 0.8826, UEM: 0.5689, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8491, partial_loss/deprel_loss: 1.1676, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4579, loss: 0.8126, batch_reg_loss: 0.1540, reg_loss: 0.1534 ||:  79%|#######8  | 75/95 [00:51<00:13,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9367, LAS: 0.8821, UEM: 0.5602, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7321, partial_loss/deprel_loss: 0.8468, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9780, loss: 0.8171, batch_reg_loss: 0.1541, reg_loss: 0.1534 ||:  83%|########3 | 79/95 [00:54<00:10,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9371, LAS: 0.8825, UEM: 0.5707, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1588, partial_loss/deprel_loss: 0.3685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4807, loss: 0.8144, batch_reg_loss: 0.1541, reg_loss: 0.1535 ||:  87%|########7 | 83/95 [00:57<00:08,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9373, LAS: 0.8828, UEM: 0.5761, LEM: 0.3311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1189, partial_loss/deprel_loss: 0.2510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3788, loss: 0.8118, batch_reg_loss: 0.1542, reg_loss: 0.1535 ||:  92%|#########1| 87/95 [01:00<00:05,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9379, LAS: 0.8834, UEM: 0.5767, LEM: 0.3294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2888, partial_loss/deprel_loss: 0.4539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5751, loss: 0.8068, batch_reg_loss: 0.1543, reg_loss: 0.1535 ||:  96%|#########5| 91/95 [01:02<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9380, LAS: 0.8835, UEM: 0.5754, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4507, partial_loss/deprel_loss: 0.6335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7513, loss: 0.8063, batch_reg_loss: 0.1543, reg_loss: 0.1535 ||:  99%|#########8| 94/95 [01:04<00:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9378, LAS: 0.8832, UEM: 0.5728, LEM: 0.3258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0441, partial_loss/deprel_loss: 0.9468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1206, loss: 0.8096, batch_reg_loss: 0.1544, reg_loss: 0.1536 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n",
+      "2023-04-06 23:52:39,843 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9485, LAS: 0.8993, UEM: 0.6034, LEM: 0.3028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9159, partial_loss/deprel_loss: 29.4420, partial_loss/cycle_loss: 0.0000, batch_loss: 23.7367, loss: 22.1813, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:07,  1.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8371, UAS: 0.9402, LAS: 0.8871, UEM: 0.5676, LEM: 0.2821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4387, partial_loss/deprel_loss: 59.0686, partial_loss/cycle_loss: 0.0000, batch_loss: 47.5426, loss: 28.3777, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  55%|#####4    | 6/11 [00:05<00:04,  1.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8807, UAS: 0.9450, LAS: 0.8928, UEM: 0.6581, LEM: 0.4051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8604, partial_loss/deprel_loss: 34.5645, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8236, loss: 26.8009, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:07<00:02,  1.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9466, LAS: 0.8934, UEM: 0.6662, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4874, partial_loss/deprel_loss: 29.6997, partial_loss/cycle_loss: 0.0000, batch_loss: 23.8572, loss: 26.9928, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9466, LAS: 0.8934, UEM: 0.6662, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4874, partial_loss/deprel_loss: 29.6997, partial_loss/cycle_loss: 0.0000, batch_loss: 23.8572, loss: 26.9928, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.06it/s]\n",
+      "2023-04-06 23:52:50,238 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.154  |     0.000\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - UEM                      |     0.573  |     0.666\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - LEM                      |     0.326  |     0.397\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - EM                       |     0.851  |     0.896\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.044  |     0.487\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - UAS                      |     0.938  |     0.947\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.947  |    29.700\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - loss                     |     0.810  |    26.993\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - LAS                      |     0.883  |     0.893\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:52:50,239 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:52:50,240 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:52:50,240 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:52:50,240 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:52:50,240 - INFO - combo.training.trainer - Epoch duration: 0:01:15.654778\n",
+      "2023-04-06 23:52:50,240 - INFO - combo.training.trainer - Estimated training time remaining: 6:28:26\n",
+      "2023-04-06 23:52:50,240 - INFO - allennlp.training.trainer - Epoch 56/399\n",
+      "2023-04-06 23:52:50,240 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:52:50,241 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:52:50,246 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8305, UAS: 0.9262, LAS: 0.8712, UEM: 0.3168, LEM: 0.0991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3721, partial_loss/deprel_loss: 0.9398, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1807, loss: 0.8943, batch_reg_loss: 0.1544, reg_loss: 0.1544 ||:   4%|4         | 4/95 [00:02<00:52,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9322, LAS: 0.8770, UEM: 0.4235, LEM: 0.1870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4081, partial_loss/deprel_loss: 0.5488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6752, loss: 0.8571, batch_reg_loss: 0.1545, reg_loss: 0.1544 ||:   7%|7         | 7/95 [00:04<00:53,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9325, LAS: 0.8772, UEM: 0.4856, LEM: 0.2496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6284, partial_loss/deprel_loss: 0.7571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8859, loss: 0.8623, batch_reg_loss: 0.1545, reg_loss: 0.1544 ||:  11%|#         | 10/95 [00:06<00:55,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9383, LAS: 0.8840, UEM: 0.5598, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2178, partial_loss/deprel_loss: 0.4345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5457, loss: 0.8084, batch_reg_loss: 0.1546, reg_loss: 0.1545 ||:  14%|#3        | 13/95 [00:08<00:54,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9405, LAS: 0.8866, UEM: 0.5888, LEM: 0.3371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7046, partial_loss/deprel_loss: 0.7288, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8785, loss: 0.7837, batch_reg_loss: 0.1546, reg_loss: 0.1545 ||:  17%|#6        | 16/95 [00:10<00:52,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9426, LAS: 0.8891, UEM: 0.5805, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3558, partial_loss/deprel_loss: 0.5277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6480, loss: 0.7713, batch_reg_loss: 0.1547, reg_loss: 0.1545 ||:  21%|##1       | 20/95 [00:13<00:49,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9432, LAS: 0.8909, UEM: 0.6266, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5408, partial_loss/deprel_loss: 0.5727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7211, loss: 0.7608, batch_reg_loss: 0.1547, reg_loss: 0.1546 ||:  24%|##4       | 23/95 [00:15<00:49,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9439, LAS: 0.8914, UEM: 0.6181, LEM: 0.3890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8244, partial_loss/deprel_loss: 0.7752, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9398, loss: 0.7575, batch_reg_loss: 0.1548, reg_loss: 0.1546 ||:  28%|##8       | 27/95 [00:18<00:45,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9449, LAS: 0.8917, UEM: 0.6201, LEM: 0.3806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6989, partial_loss/deprel_loss: 0.8017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9360, loss: 0.7524, batch_reg_loss: 0.1548, reg_loss: 0.1546 ||:  32%|###1      | 30/95 [00:20<00:44,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9442, LAS: 0.8912, UEM: 0.6167, LEM: 0.3749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5697, partial_loss/deprel_loss: 0.5757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7294, loss: 0.7548, batch_reg_loss: 0.1549, reg_loss: 0.1546 ||:  36%|###5      | 34/95 [00:22<00:41,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8981, UAS: 0.9415, LAS: 0.8884, UEM: 0.6010, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4092, partial_loss/deprel_loss: 0.6103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7250, loss: 0.7745, batch_reg_loss: 0.1550, reg_loss: 0.1547 ||:  39%|###8      | 37/95 [00:24<00:39,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9407, LAS: 0.8875, UEM: 0.5969, LEM: 0.3615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3139, partial_loss/deprel_loss: 0.4131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5483, loss: 0.7804, batch_reg_loss: 0.1550, reg_loss: 0.1547 ||:  42%|####2     | 40/95 [00:27<00:38,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9004, UAS: 0.9415, LAS: 0.8882, UEM: 0.6005, LEM: 0.3620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3625, partial_loss/deprel_loss: 0.5394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6591, loss: 0.7746, batch_reg_loss: 0.1551, reg_loss: 0.1547 ||:  45%|####5     | 43/95 [00:29<00:39,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9415, LAS: 0.8882, UEM: 0.5928, LEM: 0.3546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.5092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6367, loss: 0.7747, batch_reg_loss: 0.1551, reg_loss: 0.1547 ||:  48%|####8     | 46/95 [00:31<00:36,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9408, LAS: 0.8876, UEM: 0.5904, LEM: 0.3519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5980, partial_loss/deprel_loss: 0.6605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8032, loss: 0.7798, batch_reg_loss: 0.1552, reg_loss: 0.1548 ||:  52%|#####1    | 49/95 [00:34<00:33,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9415, LAS: 0.8884, UEM: 0.5918, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2679, partial_loss/deprel_loss: 0.4459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5655, loss: 0.7738, batch_reg_loss: 0.1552, reg_loss: 0.1548 ||:  55%|#####4    | 52/95 [00:36<00:30,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9396, LAS: 0.8862, UEM: 0.5763, LEM: 0.3381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7964, partial_loss/deprel_loss: 0.7824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9405, loss: 0.7906, batch_reg_loss: 0.1553, reg_loss: 0.1548 ||:  59%|#####8    | 56/95 [00:38<00:27,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7874, UAS: 0.9390, LAS: 0.8856, UEM: 0.5793, LEM: 0.3393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9541, partial_loss/deprel_loss: 1.2240, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5254, loss: 0.7949, batch_reg_loss: 0.1553, reg_loss: 0.1549 ||:  63%|######3   | 60/95 [00:41<00:23,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7955, UAS: 0.9389, LAS: 0.8856, UEM: 0.5938, LEM: 0.3560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5819, partial_loss/deprel_loss: 1.1667, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4052, loss: 0.7929, batch_reg_loss: 0.1554, reg_loss: 0.1549 ||:  67%|######7   | 64/95 [00:43<00:20,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9391, LAS: 0.8859, UEM: 0.5976, LEM: 0.3606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1142, partial_loss/deprel_loss: 0.3327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4445, loss: 0.7904, batch_reg_loss: 0.1555, reg_loss: 0.1549 ||:  72%|#######1  | 68/95 [00:46<00:18,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9399, LAS: 0.8865, UEM: 0.5956, LEM: 0.3551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5234, partial_loss/deprel_loss: 0.7011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8211, loss: 0.7863, batch_reg_loss: 0.1555, reg_loss: 0.1550 ||:  76%|#######5  | 72/95 [00:49<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9390, LAS: 0.8855, UEM: 0.5850, LEM: 0.3461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6051, partial_loss/deprel_loss: 0.6956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8331, loss: 0.7931, batch_reg_loss: 0.1556, reg_loss: 0.1550 ||:  80%|########  | 76/95 [00:52<00:12,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8459, UAS: 0.9392, LAS: 0.8854, UEM: 0.5840, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0770, partial_loss/deprel_loss: 0.9281, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1136, loss: 0.7925, batch_reg_loss: 0.1557, reg_loss: 0.1550 ||:  84%|########4 | 80/95 [00:54<00:10,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9398, LAS: 0.8862, UEM: 0.5856, LEM: 0.3411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4596, partial_loss/deprel_loss: 0.6046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7314, loss: 0.7873, batch_reg_loss: 0.1557, reg_loss: 0.1550 ||:  87%|########7 | 83/95 [00:56<00:08,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9392, LAS: 0.8855, UEM: 0.5793, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3229, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6098, loss: 0.7921, batch_reg_loss: 0.1558, reg_loss: 0.1551 ||:  92%|#########1| 87/95 [00:59<00:05,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9390, LAS: 0.8853, UEM: 0.5784, LEM: 0.3357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7266, partial_loss/deprel_loss: 0.7919, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9347, loss: 0.7935, batch_reg_loss: 0.1559, reg_loss: 0.1551 ||:  95%|#########4| 90/95 [01:01<00:03,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8619, UAS: 0.9386, LAS: 0.8848, UEM: 0.5719, LEM: 0.3303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8613, partial_loss/deprel_loss: 0.8771, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0299, loss: 0.7983, batch_reg_loss: 0.1559, reg_loss: 0.1551 ||:  99%|#########8| 94/95 [01:04<00:00,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9382, LAS: 0.8843, UEM: 0.5696, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1757, partial_loss/deprel_loss: 0.9447, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1468, loss: 0.8020, batch_reg_loss: 0.1559, reg_loss: 0.1551 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n",
+      "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.155  |       N/A\n",
+      "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - UEM                      |     0.570  |       N/A\n",
+      "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - LEM                      |     0.329  |       N/A\n",
+      "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - EM                       |     0.844  |       N/A\n",
+      "2023-04-06 23:53:55,303 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.176  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - UAS                      |     0.938  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.945  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - loss                     |     0.802  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - LAS                      |     0.884  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:53:55,304 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:53:55,305 - INFO - combo.training.trainer - Epoch duration: 0:01:05.064412\n",
+      "2023-04-06 23:53:55,305 - INFO - combo.training.trainer - Estimated training time remaining: 6:27:02\n",
+      "2023-04-06 23:53:55,305 - INFO - allennlp.training.trainer - Epoch 57/399\n",
+      "2023-04-06 23:53:55,305 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:53:55,305 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:53:55,311 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9514, LAS: 0.8998, UEM: 0.5685, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6102, partial_loss/deprel_loss: 0.6701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8141, loss: 0.6940, batch_reg_loss: 0.1560, reg_loss: 0.1560 ||:   3%|3         | 3/95 [00:02<01:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9429, LAS: 0.8933, UEM: 0.6418, LEM: 0.4220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8174, partial_loss/deprel_loss: 0.6788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8626, loss: 0.7285, batch_reg_loss: 0.1560, reg_loss: 0.1560 ||:   6%|6         | 6/95 [00:04<01:01,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9323, LAS: 0.8814, UEM: 0.5794, LEM: 0.3624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4063, partial_loss/deprel_loss: 0.4939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6324, loss: 0.8184, batch_reg_loss: 0.1561, reg_loss: 0.1560 ||:   9%|9         | 9/95 [00:06<00:59,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9295, LAS: 0.8768, UEM: 0.5295, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5860, partial_loss/deprel_loss: 0.6730, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8118, loss: 0.8601, batch_reg_loss: 0.1562, reg_loss: 0.1561 ||:  14%|#3        | 13/95 [00:08<00:55,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9299, LAS: 0.8773, UEM: 0.5165, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2354, partial_loss/deprel_loss: 0.4117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5327, loss: 0.8636, batch_reg_loss: 0.1562, reg_loss: 0.1561 ||:  17%|#6        | 16/95 [00:10<00:53,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9312, LAS: 0.8786, UEM: 0.5149, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9326, partial_loss/deprel_loss: 0.7946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9785, loss: 0.8560, batch_reg_loss: 0.1563, reg_loss: 0.1561 ||:  21%|##1       | 20/95 [00:13<00:49,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8510, UAS: 0.9314, LAS: 0.8781, UEM: 0.4962, LEM: 0.2743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9069, partial_loss/deprel_loss: 0.8206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9942, loss: 0.8563, batch_reg_loss: 0.1564, reg_loss: 0.1562 ||:  24%|##4       | 23/95 [00:15<00:48,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8687, UAS: 0.9310, LAS: 0.8775, UEM: 0.4864, LEM: 0.2669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8210, partial_loss/deprel_loss: 0.7806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9451, loss: 0.8614, batch_reg_loss: 0.1564, reg_loss: 0.1562 ||:  27%|##7       | 26/95 [00:17<00:47,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9330, LAS: 0.8797, UEM: 0.4983, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3869, partial_loss/deprel_loss: 0.5806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6983, loss: 0.8448, batch_reg_loss: 0.1565, reg_loss: 0.1562 ||:  31%|###       | 29/95 [00:19<00:46,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9231, UAS: 0.9360, LAS: 0.8833, UEM: 0.5451, LEM: 0.3109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2559, partial_loss/deprel_loss: 0.4483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5663, loss: 0.8185, batch_reg_loss: 0.1565, reg_loss: 0.1562 ||:  34%|###3      | 32/95 [00:21<00:44,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9353, LAS: 0.8824, UEM: 0.5308, LEM: 0.2968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4447, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6102, loss: 0.8230, batch_reg_loss: 0.1566, reg_loss: 0.1563 ||:  38%|###7      | 36/95 [00:24<00:40,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9349, LAS: 0.8817, UEM: 0.5291, LEM: 0.2952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7084, partial_loss/deprel_loss: 0.7378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8886, loss: 0.8245, batch_reg_loss: 0.1566, reg_loss: 0.1563 ||:  41%|####1     | 39/95 [00:26<00:39,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9360, LAS: 0.8826, UEM: 0.5297, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4608, partial_loss/deprel_loss: 0.6143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7403, loss: 0.8194, batch_reg_loss: 0.1567, reg_loss: 0.1563 ||:  44%|####4     | 42/95 [00:28<00:37,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8561, UAS: 0.9374, LAS: 0.8840, UEM: 0.5491, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9230, partial_loss/deprel_loss: 0.8469, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0189, loss: 0.8084, batch_reg_loss: 0.1568, reg_loss: 0.1564 ||:  48%|####8     | 46/95 [00:31<00:34,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8981, UAS: 0.9383, LAS: 0.8847, UEM: 0.5481, LEM: 0.2973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4649, partial_loss/deprel_loss: 0.5608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6985, loss: 0.8031, batch_reg_loss: 0.1568, reg_loss: 0.1564 ||:  52%|#####1    | 49/95 [00:35<00:40,  1.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9386, LAS: 0.8848, UEM: 0.5428, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3975, partial_loss/deprel_loss: 0.5208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.8013, batch_reg_loss: 0.1568, reg_loss: 0.1564 ||:  55%|#####4    | 52/95 [00:37<00:35,  1.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9132, UAS: 0.9388, LAS: 0.8851, UEM: 0.5479, LEM: 0.2955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2873, partial_loss/deprel_loss: 0.3841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5216, loss: 0.7988, batch_reg_loss: 0.1569, reg_loss: 0.1564 ||:  58%|#####7    | 55/95 [00:39<00:32,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9600, UAS: 0.9386, LAS: 0.8854, UEM: 0.5680, LEM: 0.3294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0666, partial_loss/deprel_loss: 0.1669, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3038, loss: 0.8006, batch_reg_loss: 0.1569, reg_loss: 0.1565 ||:  62%|######2   | 59/95 [00:42<00:28,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9386, LAS: 0.8854, UEM: 0.5663, LEM: 0.3273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2632, partial_loss/deprel_loss: 0.4677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.7999, batch_reg_loss: 0.1570, reg_loss: 0.1565 ||:  65%|######5   | 62/95 [00:45<00:25,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9385, LAS: 0.8852, UEM: 0.5681, LEM: 0.3271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2532, partial_loss/deprel_loss: 0.4551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5718, loss: 0.8015, batch_reg_loss: 0.1570, reg_loss: 0.1565 ||:  68%|######8   | 65/95 [00:47<00:23,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9393, LAS: 0.8861, UEM: 0.5810, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6600, partial_loss/deprel_loss: 0.7542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8925, loss: 0.7937, batch_reg_loss: 0.1571, reg_loss: 0.1565 ||:  72%|#######1  | 68/95 [00:49<00:20,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9401, LAS: 0.8870, UEM: 0.5895, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4321, partial_loss/deprel_loss: 0.5371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6732, loss: 0.7851, batch_reg_loss: 0.1571, reg_loss: 0.1566 ||:  75%|#######4  | 71/95 [00:51<00:18,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9406, LAS: 0.8876, UEM: 0.5927, LEM: 0.3449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3304, partial_loss/deprel_loss: 0.5570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6689, loss: 0.7806, batch_reg_loss: 0.1572, reg_loss: 0.1566 ||:  78%|#######7  | 74/95 [00:53<00:15,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9402, LAS: 0.8869, UEM: 0.5958, LEM: 0.3471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.3719, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4863, loss: 0.7857, batch_reg_loss: 0.1572, reg_loss: 0.1566 ||:  82%|########2 | 78/95 [00:56<00:12,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9400, LAS: 0.8867, UEM: 0.5954, LEM: 0.3469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1439, partial_loss/deprel_loss: 0.3659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4787, loss: 0.7872, batch_reg_loss: 0.1573, reg_loss: 0.1566 ||:  85%|########5 | 81/95 [00:58<00:10,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9388, LAS: 0.8855, UEM: 0.5889, LEM: 0.3407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5523, partial_loss/deprel_loss: 0.6464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7849, loss: 0.7964, batch_reg_loss: 0.1573, reg_loss: 0.1567 ||:  89%|########9 | 85/95 [01:01<00:07,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8431, UAS: 0.9382, LAS: 0.8849, UEM: 0.5850, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2189, partial_loss/deprel_loss: 0.9243, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1406, loss: 0.8010, batch_reg_loss: 0.1574, reg_loss: 0.1567 ||:  93%|#########2| 88/95 [01:03<00:04,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8519, UAS: 0.9382, LAS: 0.8847, UEM: 0.5793, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0566, partial_loss/deprel_loss: 0.9256, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1092, loss: 0.8039, batch_reg_loss: 0.1574, reg_loss: 0.1567 ||:  97%|#########6| 92/95 [01:06<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8719, UAS: 0.9386, LAS: 0.8851, UEM: 0.5787, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7973, partial_loss/deprel_loss: 0.7478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9152, loss: 0.8015, batch_reg_loss: 0.1575, reg_loss: 0.1568 ||: 100%|##########| 95/95 [01:08<00:00,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8719, UAS: 0.9386, LAS: 0.8851, UEM: 0.5787, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7973, partial_loss/deprel_loss: 0.7478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9152, loss: 0.8015, batch_reg_loss: 0.1575, reg_loss: 0.1568 ||: 100%|##########| 95/95 [01:08<00:00,  1.39it/s]\n",
+      "2023-04-06 23:55:03,586 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:55:03,586 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-06 23:55:03,586 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.157  |       N/A\n",
+      "2023-04-06 23:55:03,586 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - UEM                      |     0.579  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - LEM                      |     0.331  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - EM                       |     0.872  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.797  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - UAS                      |     0.939  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.748  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - loss                     |     0.802  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - LAS                      |     0.885  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:55:03,587 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:55:03,588 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:55:03,588 - INFO - combo.training.trainer - Epoch duration: 0:01:08.283101\n",
+      "2023-04-06 23:55:03,588 - INFO - combo.training.trainer - Estimated training time remaining: 6:25:58\n",
+      "2023-04-06 23:55:03,588 - INFO - allennlp.training.trainer - Epoch 58/399\n",
+      "2023-04-06 23:55:03,588 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:55:03,589 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:55:03,595 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9535, LAS: 0.9048, UEM: 0.6764, LEM: 0.4264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2934, partial_loss/deprel_loss: 0.4203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5525, loss: 0.6294, batch_reg_loss: 0.1576, reg_loss: 0.1575 ||:   4%|4         | 4/95 [00:02<00:57,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9500, LAS: 0.8997, UEM: 0.6510, LEM: 0.3980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7014, partial_loss/deprel_loss: 0.7054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8623, loss: 0.6667, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||:   7%|7         | 7/95 [00:04<00:56,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8508, UAS: 0.9462, LAS: 0.8961, UEM: 0.7060, LEM: 0.5104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0477, partial_loss/deprel_loss: 0.8501, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0473, loss: 0.7036, batch_reg_loss: 0.1577, reg_loss: 0.1576 ||:  11%|#         | 10/95 [00:06<00:58,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8719, UAS: 0.9474, LAS: 0.8962, UEM: 0.6754, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6657, partial_loss/deprel_loss: 0.8229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9492, loss: 0.7093, batch_reg_loss: 0.1577, reg_loss: 0.1576 ||:  15%|#4        | 14/95 [00:09<00:53,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8636, UAS: 0.9421, LAS: 0.8899, UEM: 0.6545, LEM: 0.4361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8990, partial_loss/deprel_loss: 0.8420, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0112, loss: 0.7615, batch_reg_loss: 0.1578, reg_loss: 0.1577 ||:  18%|#7        | 17/95 [00:11<00:53,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9386, LAS: 0.8864, UEM: 0.6129, LEM: 0.3951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6553, partial_loss/deprel_loss: 0.6360, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7977, loss: 0.7913, batch_reg_loss: 0.1579, reg_loss: 0.1577 ||:  22%|##2       | 21/95 [00:14<00:50,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9410, LAS: 0.8891, UEM: 0.6241, LEM: 0.3942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2191, partial_loss/deprel_loss: 0.4281, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5443, loss: 0.7703, batch_reg_loss: 0.1579, reg_loss: 0.1577 ||:  25%|##5       | 24/95 [00:16<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9409, LAS: 0.8887, UEM: 0.6214, LEM: 0.3859, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4183, partial_loss/deprel_loss: 0.5498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6815, loss: 0.7742, batch_reg_loss: 0.1580, reg_loss: 0.1577 ||:  28%|##8       | 27/95 [00:18<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9412, LAS: 0.8893, UEM: 0.6210, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3110, partial_loss/deprel_loss: 0.3967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5376, loss: 0.7676, batch_reg_loss: 0.1580, reg_loss: 0.1578 ||:  32%|###1      | 30/95 [00:20<00:48,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8546, UAS: 0.9412, LAS: 0.8894, UEM: 0.6169, LEM: 0.3763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9132, partial_loss/deprel_loss: 0.8714, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0378, loss: 0.7685, batch_reg_loss: 0.1581, reg_loss: 0.1578 ||:  35%|###4      | 33/95 [00:23<00:45,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9429, LAS: 0.8910, UEM: 0.6139, LEM: 0.3650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3775, partial_loss/deprel_loss: 0.5630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6840, loss: 0.7588, batch_reg_loss: 0.1581, reg_loss: 0.1578 ||:  39%|###8      | 37/95 [00:25<00:40,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9430, LAS: 0.8911, UEM: 0.6065, LEM: 0.3568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2773, partial_loss/deprel_loss: 0.5158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6263, loss: 0.7592, batch_reg_loss: 0.1582, reg_loss: 0.1579 ||:  42%|####2     | 40/95 [00:27<00:39,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9410, LAS: 0.8892, UEM: 0.6008, LEM: 0.3545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.3492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4721, loss: 0.7747, batch_reg_loss: 0.1582, reg_loss: 0.1579 ||:  46%|####6     | 44/95 [00:30<00:36,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9413, LAS: 0.8894, UEM: 0.5904, LEM: 0.3423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5840, partial_loss/deprel_loss: 0.6788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8182, loss: 0.7717, batch_reg_loss: 0.1583, reg_loss: 0.1579 ||:  51%|#####     | 48/95 [00:32<00:31,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9409, LAS: 0.8889, UEM: 0.5887, LEM: 0.3417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5248, partial_loss/deprel_loss: 0.6978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8215, loss: 0.7760, batch_reg_loss: 0.1584, reg_loss: 0.1580 ||:  55%|#####4    | 52/95 [00:35<00:28,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8261, UAS: 0.9389, LAS: 0.8867, UEM: 0.5847, LEM: 0.3377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2997, partial_loss/deprel_loss: 0.9815, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2036, loss: 0.7913, batch_reg_loss: 0.1584, reg_loss: 0.1580 ||:  59%|#####8    | 56/95 [00:38<00:26,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9382, LAS: 0.8857, UEM: 0.5789, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2292, partial_loss/deprel_loss: 0.4372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5541, loss: 0.8001, batch_reg_loss: 0.1585, reg_loss: 0.1580 ||:  63%|######3   | 60/95 [00:40<00:23,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9382, LAS: 0.8857, UEM: 0.5745, LEM: 0.3298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7031, partial_loss/deprel_loss: 0.7636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9101, loss: 0.8013, batch_reg_loss: 0.1586, reg_loss: 0.1581 ||:  67%|######7   | 64/95 [00:43<00:21,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9375, LAS: 0.8849, UEM: 0.5662, LEM: 0.3219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4286, partial_loss/deprel_loss: 0.5786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7073, loss: 0.8071, batch_reg_loss: 0.1587, reg_loss: 0.1581 ||:  72%|#######1  | 68/95 [00:46<00:17,  1.52it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9377, LAS: 0.8849, UEM: 0.5654, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5361, loss: 0.8082, batch_reg_loss: 0.1587, reg_loss: 0.1581 ||:  76%|#######5  | 72/95 [00:48<00:15,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9376, LAS: 0.8847, UEM: 0.5615, LEM: 0.3154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4792, partial_loss/deprel_loss: 0.6233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7533, loss: 0.8099, batch_reg_loss: 0.1588, reg_loss: 0.1582 ||:  80%|########  | 76/95 [00:52<00:13,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9378, LAS: 0.8848, UEM: 0.5582, LEM: 0.3110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4244, partial_loss/deprel_loss: 0.5378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6739, loss: 0.8090, batch_reg_loss: 0.1589, reg_loss: 0.1582 ||:  83%|########3 | 79/95 [00:54<00:11,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9391, LAS: 0.8863, UEM: 0.5690, LEM: 0.3173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2843, partial_loss/deprel_loss: 0.4835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6026, loss: 0.7994, batch_reg_loss: 0.1589, reg_loss: 0.1582 ||:  87%|########7 | 83/95 [00:56<00:08,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9388, LAS: 0.8860, UEM: 0.5645, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.5243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6545, loss: 0.8033, batch_reg_loss: 0.1590, reg_loss: 0.1583 ||:  92%|#########1| 87/95 [00:59<00:05,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9383, LAS: 0.8854, UEM: 0.5636, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3970, partial_loss/deprel_loss: 0.5750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6984, loss: 0.8081, batch_reg_loss: 0.1590, reg_loss: 0.1583 ||:  95%|#########4| 90/95 [01:01<00:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9389, LAS: 0.8861, UEM: 0.5803, LEM: 0.3315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1318, partial_loss/deprel_loss: 0.2567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3908, loss: 0.8016, batch_reg_loss: 0.1591, reg_loss: 0.1583 ||:  98%|#########7| 93/95 [01:04<00:01,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9389, LAS: 0.8862, UEM: 0.5780, LEM: 0.3291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3488, partial_loss/deprel_loss: 0.5293, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6523, loss: 0.8017, batch_reg_loss: 0.1591, reg_loss: 0.1583 ||: 100%|##########| 95/95 [01:05<00:00,  1.45it/s]\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.158  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - UEM                      |     0.578  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - LEM                      |     0.329  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - EM                       |     0.904  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.349  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - UAS                      |     0.939  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.529  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - loss                     |     0.802  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - LAS                      |     0.886  |       N/A\n",
+      "2023-04-06 23:56:08,966 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:56:08,967 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:56:08,967 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:56:08,967 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:56:08,967 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:56:08,967 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:56:08,967 - INFO - combo.training.trainer - Epoch duration: 0:01:05.378838\n",
+      "2023-04-06 23:56:08,967 - INFO - combo.training.trainer - Estimated training time remaining: 6:24:36\n",
+      "2023-04-06 23:56:08,967 - INFO - allennlp.training.trainer - Epoch 59/399\n",
+      "2023-04-06 23:56:08,967 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:56:08,967 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:56:08,972 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9668, LAS: 0.9214, UEM: 0.8388, LEM: 0.6739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2145, partial_loss/deprel_loss: 0.4612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5710, loss: 0.5334, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:   3%|3         | 3/95 [00:02<01:12,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9447, LAS: 0.8962, UEM: 0.7278, LEM: 0.5356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4894, partial_loss/deprel_loss: 0.6428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7714, loss: 0.7324, batch_reg_loss: 0.1592, reg_loss: 0.1592 ||:   7%|7         | 7/95 [00:04<01:04,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9368, LAS: 0.8860, UEM: 0.6479, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3521, partial_loss/deprel_loss: 0.4918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6231, loss: 0.7971, batch_reg_loss: 0.1592, reg_loss: 0.1592 ||:  12%|#1        | 11/95 [00:07<00:59,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9405, LAS: 0.8894, UEM: 0.6198, LEM: 0.4015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4050, partial_loss/deprel_loss: 0.4890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6315, loss: 0.7755, batch_reg_loss: 0.1593, reg_loss: 0.1592 ||:  16%|#5        | 15/95 [00:09<00:54,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9432, LAS: 0.8910, UEM: 0.6084, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4418, partial_loss/deprel_loss: 0.5769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7093, loss: 0.7605, batch_reg_loss: 0.1594, reg_loss: 0.1592 ||:  20%|##        | 19/95 [00:12<00:51,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9429, LAS: 0.8900, UEM: 0.5828, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4115, partial_loss/deprel_loss: 0.5493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6811, loss: 0.7659, batch_reg_loss: 0.1594, reg_loss: 0.1593 ||:  24%|##4       | 23/95 [00:15<00:48,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9435, LAS: 0.8912, UEM: 0.6006, LEM: 0.3587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2167, partial_loss/deprel_loss: 0.3695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4984, loss: 0.7566, batch_reg_loss: 0.1595, reg_loss: 0.1593 ||:  27%|##7       | 26/95 [00:17<00:47,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9447, LAS: 0.8927, UEM: 0.6153, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3898, partial_loss/deprel_loss: 0.5664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6906, loss: 0.7423, batch_reg_loss: 0.1595, reg_loss: 0.1593 ||:  31%|###       | 29/95 [00:19<00:45,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8538, UAS: 0.9444, LAS: 0.8926, UEM: 0.6101, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9486, partial_loss/deprel_loss: 0.8810, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0541, loss: 0.7445, batch_reg_loss: 0.1596, reg_loss: 0.1593 ||:  35%|###4      | 33/95 [00:22<00:42,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9452, LAS: 0.8934, UEM: 0.6117, LEM: 0.3593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3082, partial_loss/deprel_loss: 0.5202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6374, loss: 0.7371, batch_reg_loss: 0.1596, reg_loss: 0.1594 ||:  38%|###7      | 36/95 [00:24<00:40,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8725, UAS: 0.9432, LAS: 0.8910, UEM: 0.5908, LEM: 0.3416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6523, partial_loss/deprel_loss: 0.6621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8198, loss: 0.7559, batch_reg_loss: 0.1597, reg_loss: 0.1594 ||:  42%|####2     | 40/95 [00:26<00:35,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9442, LAS: 0.8916, UEM: 0.5983, LEM: 0.3473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6514, partial_loss/deprel_loss: 0.7769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9115, loss: 0.7486, batch_reg_loss: 0.1597, reg_loss: 0.1594 ||:  47%|####7     | 45/95 [00:29<00:30,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9431, LAS: 0.8904, UEM: 0.5858, LEM: 0.3349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4181, partial_loss/deprel_loss: 0.6002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7236, loss: 0.7604, batch_reg_loss: 0.1598, reg_loss: 0.1595 ||:  52%|#####1    | 49/95 [00:31<00:27,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8748, UAS: 0.9424, LAS: 0.8899, UEM: 0.5948, LEM: 0.3484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6893, partial_loss/deprel_loss: 0.6942, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8530, loss: 0.7647, batch_reg_loss: 0.1598, reg_loss: 0.1595 ||:  56%|#####5    | 53/95 [00:33<00:25,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9434, LAS: 0.8910, UEM: 0.6033, LEM: 0.3512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2670, partial_loss/deprel_loss: 0.4293, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5567, loss: 0.7560, batch_reg_loss: 0.1599, reg_loss: 0.1595 ||:  60%|######    | 57/95 [00:36<00:24,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9424, LAS: 0.8897, UEM: 0.5927, LEM: 0.3424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9398, partial_loss/deprel_loss: 0.8258, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0086, loss: 0.7681, batch_reg_loss: 0.1600, reg_loss: 0.1595 ||:  64%|######4   | 61/95 [00:39<00:21,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9415, LAS: 0.8887, UEM: 0.5846, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1753, partial_loss/deprel_loss: 0.8177, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0493, loss: 0.7768, batch_reg_loss: 0.1600, reg_loss: 0.1596 ||:  68%|######8   | 65/95 [00:41<00:19,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8253, UAS: 0.9403, LAS: 0.8875, UEM: 0.5899, LEM: 0.3469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4067, partial_loss/deprel_loss: 0.9934, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2361, loss: 0.7864, batch_reg_loss: 0.1601, reg_loss: 0.1596 ||:  73%|#######2  | 69/95 [00:44<00:16,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9406, LAS: 0.8879, UEM: 0.5918, LEM: 0.3483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3396, partial_loss/deprel_loss: 0.5143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6395, loss: 0.7834, batch_reg_loss: 0.1602, reg_loss: 0.1596 ||:  77%|#######6  | 73/95 [00:47<00:14,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9404, LAS: 0.8874, UEM: 0.5856, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6402, partial_loss/deprel_loss: 0.7421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8819, loss: 0.7881, batch_reg_loss: 0.1602, reg_loss: 0.1597 ||:  81%|########1 | 77/95 [00:49<00:11,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9396, LAS: 0.8863, UEM: 0.5803, LEM: 0.3375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0770, partial_loss/deprel_loss: 0.9965, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1729, loss: 0.7966, batch_reg_loss: 0.1603, reg_loss: 0.1597 ||:  85%|########5 | 81/95 [00:52<00:09,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9397, LAS: 0.8863, UEM: 0.5751, LEM: 0.3319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4392, partial_loss/deprel_loss: 0.6400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7602, loss: 0.7989, batch_reg_loss: 0.1604, reg_loss: 0.1597 ||:  89%|########9 | 85/95 [00:55<00:06,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9386, LAS: 0.8850, UEM: 0.5739, LEM: 0.3309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3208, partial_loss/deprel_loss: 0.4776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6067, loss: 0.8075, batch_reg_loss: 0.1604, reg_loss: 0.1597 ||:  93%|#########2| 88/95 [00:57<00:04,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9392, LAS: 0.8857, UEM: 0.5768, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1678, partial_loss/deprel_loss: 0.3699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4900, loss: 0.8025, batch_reg_loss: 0.1605, reg_loss: 0.1598 ||:  96%|#########5| 91/95 [00:59<00:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9391, LAS: 0.8854, UEM: 0.5732, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3238, partial_loss/deprel_loss: 0.5131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6358, loss: 0.8066, batch_reg_loss: 0.1606, reg_loss: 0.1598 ||: 100%|##########| 95/95 [01:02<00:00,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9391, LAS: 0.8854, UEM: 0.5732, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3238, partial_loss/deprel_loss: 0.5131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6358, loss: 0.8066, batch_reg_loss: 0.1606, reg_loss: 0.1598 ||: 100%|##########| 95/95 [01:02<00:00,  1.53it/s]\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.160  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - UEM                      |     0.573  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - LEM                      |     0.328  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - EM                       |     0.911  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.324  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - UAS                      |     0.939  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.513  |       N/A\n",
+      "2023-04-06 23:57:11,130 - INFO - combo.training.tensorboard_writer - loss                     |     0.807  |       N/A\n",
+      "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - LAS                      |     0.885  |       N/A\n",
+      "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:57:11,131 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:57:11,131 - INFO - combo.training.trainer - Epoch duration: 0:01:02.164157\n",
+      "2023-04-06 23:57:11,131 - INFO - combo.training.trainer - Estimated training time remaining: 6:22:57\n",
+      "2023-04-06 23:57:11,132 - INFO - allennlp.training.trainer - Epoch 60/399\n",
+      "2023-04-06 23:57:11,132 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:57:11,132 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:57:11,137 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9200, UAS: 0.9245, LAS: 0.8735, UEM: 0.5809, LEM: 0.3020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2835, partial_loss/deprel_loss: 0.4011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5382, loss: 0.8867, batch_reg_loss: 0.1606, reg_loss: 0.1606 ||:   4%|4         | 4/95 [00:02<00:52,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9349, LAS: 0.8832, UEM: 0.5488, LEM: 0.2704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6060, partial_loss/deprel_loss: 0.6525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8039, loss: 0.8042, batch_reg_loss: 0.1607, reg_loss: 0.1606 ||:   8%|8         | 8/95 [00:04<00:51,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9444, LAS: 0.8942, UEM: 0.6930, LEM: 0.4517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0510, partial_loss/deprel_loss: 0.1657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3035, loss: 0.7286, batch_reg_loss: 0.1608, reg_loss: 0.1607 ||:  12%|#1        | 11/95 [00:07<00:55,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9423, LAS: 0.8906, UEM: 0.6329, LEM: 0.3907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4824, partial_loss/deprel_loss: 0.5800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7213, loss: 0.7588, batch_reg_loss: 0.1608, reg_loss: 0.1607 ||:  16%|#5        | 15/95 [00:09<00:52,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9417, LAS: 0.8896, UEM: 0.5919, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5967, partial_loss/deprel_loss: 0.6186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7751, loss: 0.7680, batch_reg_loss: 0.1609, reg_loss: 0.1607 ||:  20%|##        | 19/95 [00:12<00:48,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9428, LAS: 0.8911, UEM: 0.5764, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6191, partial_loss/deprel_loss: 0.6637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8158, loss: 0.7589, batch_reg_loss: 0.1609, reg_loss: 0.1608 ||:  24%|##4       | 23/95 [00:14<00:46,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9457, LAS: 0.8947, UEM: 0.6226, LEM: 0.3809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3466, partial_loss/deprel_loss: 0.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6113, loss: 0.7316, batch_reg_loss: 0.1610, reg_loss: 0.1608 ||:  27%|##7       | 26/95 [00:17<00:47,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8313, UAS: 0.9451, LAS: 0.8939, UEM: 0.6225, LEM: 0.3755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4179, partial_loss/deprel_loss: 0.9926, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2387, loss: 0.7391, batch_reg_loss: 0.1610, reg_loss: 0.1608 ||:  32%|###1      | 30/95 [00:19<00:42,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9444, LAS: 0.8931, UEM: 0.6279, LEM: 0.3823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1271, partial_loss/deprel_loss: 0.3208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4432, loss: 0.7458, batch_reg_loss: 0.1611, reg_loss: 0.1609 ||:  36%|###5      | 34/95 [00:22<00:40,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8490, UAS: 0.9430, LAS: 0.8910, UEM: 0.6072, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0711, partial_loss/deprel_loss: 0.9718, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1528, loss: 0.7647, batch_reg_loss: 0.1612, reg_loss: 0.1609 ||:  40%|####      | 38/95 [00:24<00:36,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8729, UAS: 0.9420, LAS: 0.8900, UEM: 0.6056, LEM: 0.3677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8198, partial_loss/deprel_loss: 0.7777, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9473, loss: 0.7771, batch_reg_loss: 0.1612, reg_loss: 0.1609 ||:  44%|####4     | 42/95 [00:27<00:34,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9430, LAS: 0.8911, UEM: 0.6079, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3948, partial_loss/deprel_loss: 0.5245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6598, loss: 0.7663, batch_reg_loss: 0.1613, reg_loss: 0.1609 ||:  48%|####8     | 46/95 [00:30<00:32,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8200, UAS: 0.9429, LAS: 0.8905, UEM: 0.6061, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4237, partial_loss/deprel_loss: 1.1122, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3359, loss: 0.7717, batch_reg_loss: 0.1613, reg_loss: 0.1610 ||:  53%|#####2    | 50/95 [00:32<00:29,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9439, LAS: 0.8916, UEM: 0.6126, LEM: 0.3621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2412, partial_loss/deprel_loss: 0.4260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5504, loss: 0.7624, batch_reg_loss: 0.1614, reg_loss: 0.1610 ||:  57%|#####6    | 54/95 [00:35<00:26,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9429, LAS: 0.8902, UEM: 0.6016, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2458, partial_loss/deprel_loss: 0.4670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5842, loss: 0.7729, batch_reg_loss: 0.1615, reg_loss: 0.1610 ||:  61%|######1   | 58/95 [00:37<00:24,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9441, LAS: 0.8919, UEM: 0.6137, LEM: 0.3635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4000, partial_loss/deprel_loss: 0.6110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7303, loss: 0.7600, batch_reg_loss: 0.1615, reg_loss: 0.1611 ||:  65%|######5   | 62/95 [00:40<00:22,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9432, LAS: 0.8905, UEM: 0.6067, LEM: 0.3565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3855, partial_loss/deprel_loss: 0.5793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7021, loss: 0.7705, batch_reg_loss: 0.1616, reg_loss: 0.1611 ||:  69%|######9   | 66/95 [00:43<00:19,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8728, UAS: 0.9421, LAS: 0.8893, UEM: 0.5971, LEM: 0.3487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6925, partial_loss/deprel_loss: 0.7960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9369, loss: 0.7804, batch_reg_loss: 0.1616, reg_loss: 0.1611 ||:  74%|#######3  | 70/95 [00:46<00:16,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9419, LAS: 0.8890, UEM: 0.5929, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3221, partial_loss/deprel_loss: 0.5109, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6348, loss: 0.7832, batch_reg_loss: 0.1617, reg_loss: 0.1612 ||:  78%|#######7  | 74/95 [00:48<00:13,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9421, LAS: 0.8892, UEM: 0.5903, LEM: 0.3389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5034, partial_loss/deprel_loss: 0.6401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7745, loss: 0.7812, batch_reg_loss: 0.1618, reg_loss: 0.1612 ||:  82%|########2 | 78/95 [00:51<00:11,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9411, LAS: 0.8881, UEM: 0.5903, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4647, partial_loss/deprel_loss: 0.5666, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7081, loss: 0.7896, batch_reg_loss: 0.1618, reg_loss: 0.1612 ||:  86%|########6 | 82/95 [00:54<00:08,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8739, UAS: 0.9410, LAS: 0.8880, UEM: 0.5907, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8185, partial_loss/deprel_loss: 0.7277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9077, loss: 0.7905, batch_reg_loss: 0.1619, reg_loss: 0.1612 ||:  89%|########9 | 85/95 [00:56<00:06,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9406, LAS: 0.8877, UEM: 0.5881, LEM: 0.3401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8441, partial_loss/deprel_loss: 0.7880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9612, loss: 0.7938, batch_reg_loss: 0.1619, reg_loss: 0.1613 ||:  93%|#########2| 88/95 [00:58<00:04,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9403, LAS: 0.8873, UEM: 0.5851, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3601, partial_loss/deprel_loss: 0.4747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.7959, batch_reg_loss: 0.1620, reg_loss: 0.1613 ||:  97%|#########6| 92/95 [01:00<00:01,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9398, LAS: 0.8866, UEM: 0.5784, LEM: 0.3320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8617, partial_loss/deprel_loss: 0.7983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9730, loss: 0.8016, batch_reg_loss: 0.1620, reg_loss: 0.1613 ||: 100%|##########| 95/95 [01:02<00:00,  1.53it/s]\n",
+      "2023-04-06 23:58:13,320 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9560, LAS: 0.9073, UEM: 0.8034, LEM: 0.6181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2104, partial_loss/deprel_loss: 19.9283, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9847, loss: 26.0149, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9476, LAS: 0.8960, UEM: 0.7225, LEM: 0.5025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1885, partial_loss/deprel_loss: 22.8232, partial_loss/cycle_loss: 0.0000, batch_loss: 18.2962, loss: 29.0160, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:05,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9471, LAS: 0.8934, UEM: 0.6713, LEM: 0.4075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5159, partial_loss/deprel_loss: 24.4035, partial_loss/cycle_loss: 0.0000, batch_loss: 19.6260, loss: 26.5097, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:07<00:02,  1.10it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9489, LAS: 0.8961, UEM: 0.6698, LEM: 0.3987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2996, partial_loss/deprel_loss: 28.4184, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7947, loss: 26.7813, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00,  1.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9489, LAS: 0.8961, UEM: 0.6698, LEM: 0.3987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2996, partial_loss/deprel_loss: 28.4184, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7947, loss: 26.7813, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00,  1.16it/s]\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.161  |     0.000\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - UEM                      |     0.578  |     0.670\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - LEM                      |     0.332  |     0.399\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - EM                       |     0.870  |     0.928\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.862  |     0.300\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - UAS                      |     0.940  |     0.949\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.798  |    28.418\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - loss                     |     0.802  |    26.781\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:58:22,805 - INFO - combo.training.tensorboard_writer - LAS                      |     0.887  |     0.896\n",
+      "2023-04-06 23:58:22,806 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:58:22,806 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:58:22,806 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:58:22,806 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:58:22,806 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:58:22,806 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:58:22,806 - INFO - combo.training.trainer - Epoch duration: 0:01:11.674813\n",
+      "2023-04-06 23:58:22,806 - INFO - combo.training.trainer - Estimated training time remaining: 6:22:13\n",
+      "2023-04-06 23:58:22,806 - INFO - allennlp.training.trainer - Epoch 61/399\n",
+      "2023-04-06 23:58:22,807 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:58:22,807 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:58:22,813 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9493, LAS: 0.9001, UEM: 0.5113, LEM: 0.2608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3290, partial_loss/deprel_loss: 0.4222, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5657, loss: 0.6838, batch_reg_loss: 0.1621, reg_loss: 0.1621 ||:   3%|3         | 3/95 [00:02<01:03,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9380, LAS: 0.8878, UEM: 0.4589, LEM: 0.2282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9957, partial_loss/deprel_loss: 0.8262, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0223, loss: 0.7848, batch_reg_loss: 0.1621, reg_loss: 0.1621 ||:   6%|6         | 6/95 [00:04<01:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9442, LAS: 0.8942, UEM: 0.5610, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2538, partial_loss/deprel_loss: 0.4180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5474, loss: 0.7266, batch_reg_loss: 0.1622, reg_loss: 0.1621 ||:   9%|9         | 9/95 [00:06<01:03,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9430, LAS: 0.8916, UEM: 0.5512, LEM: 0.3020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1657, partial_loss/deprel_loss: 0.3888, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.7471, batch_reg_loss: 0.1623, reg_loss: 0.1622 ||:  14%|#3        | 13/95 [00:09<00:58,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8666, UAS: 0.9446, LAS: 0.8934, UEM: 0.5710, LEM: 0.3175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7792, partial_loss/deprel_loss: 0.8112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9671, loss: 0.7342, batch_reg_loss: 0.1623, reg_loss: 0.1622 ||:  17%|#6        | 16/95 [00:11<00:58,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9461, LAS: 0.8949, UEM: 0.5937, LEM: 0.3367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1852, partial_loss/deprel_loss: 0.3654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4918, loss: 0.7225, batch_reg_loss: 0.1624, reg_loss: 0.1622 ||:  20%|##        | 19/95 [00:13<00:55,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9465, LAS: 0.8951, UEM: 0.6055, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2041, partial_loss/deprel_loss: 0.4017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5246, loss: 0.7280, batch_reg_loss: 0.1624, reg_loss: 0.1622 ||:  24%|##4       | 23/95 [00:16<00:50,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9466, LAS: 0.8947, UEM: 0.6008, LEM: 0.3465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1822, partial_loss/deprel_loss: 0.4087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5258, loss: 0.7323, batch_reg_loss: 0.1625, reg_loss: 0.1623 ||:  28%|##8       | 27/95 [00:18<00:45,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8538, UAS: 0.9436, LAS: 0.8907, UEM: 0.5673, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9718, partial_loss/deprel_loss: 0.8352, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0251, loss: 0.7632, batch_reg_loss: 0.1625, reg_loss: 0.1623 ||:  33%|###2      | 31/95 [00:21<00:41,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8527, UAS: 0.9424, LAS: 0.8898, UEM: 0.5869, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0540, partial_loss/deprel_loss: 0.8374, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0433, loss: 0.7694, batch_reg_loss: 0.1626, reg_loss: 0.1623 ||:  37%|###6      | 35/95 [00:23<00:39,  1.52it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9438, LAS: 0.8912, UEM: 0.6027, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1477, partial_loss/deprel_loss: 0.2882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4227, loss: 0.7581, batch_reg_loss: 0.1626, reg_loss: 0.1624 ||:  40%|####      | 38/95 [00:26<00:38,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9432, LAS: 0.8908, UEM: 0.5884, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4037, partial_loss/deprel_loss: 0.5200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6594, loss: 0.7604, batch_reg_loss: 0.1627, reg_loss: 0.1624 ||:  44%|####4     | 42/95 [00:28<00:35,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9408, LAS: 0.8881, UEM: 0.5801, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0877, partial_loss/deprel_loss: 0.9107, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1088, loss: 0.7804, batch_reg_loss: 0.1627, reg_loss: 0.1624 ||:  47%|####7     | 45/95 [00:30<00:33,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7994, UAS: 0.9375, LAS: 0.8846, UEM: 0.5655, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7998, partial_loss/deprel_loss: 1.0932, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3973, loss: 0.8055, batch_reg_loss: 0.1628, reg_loss: 0.1624 ||:  52%|#####1    | 49/95 [00:33<00:29,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9374, LAS: 0.8844, UEM: 0.5565, LEM: 0.3205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4351, partial_loss/deprel_loss: 0.5761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7108, loss: 0.8063, batch_reg_loss: 0.1629, reg_loss: 0.1625 ||:  56%|#####5    | 53/95 [00:35<00:26,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9384, LAS: 0.8854, UEM: 0.5557, LEM: 0.3157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3168, partial_loss/deprel_loss: 0.5233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6449, loss: 0.7999, batch_reg_loss: 0.1630, reg_loss: 0.1625 ||:  60%|######    | 57/95 [00:37<00:23,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9392, LAS: 0.8863, UEM: 0.5548, LEM: 0.3101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3584, partial_loss/deprel_loss: 0.5174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6487, loss: 0.7932, batch_reg_loss: 0.1630, reg_loss: 0.1625 ||:  64%|######4   | 61/95 [00:40<00:21,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9395, LAS: 0.8864, UEM: 0.5497, LEM: 0.3038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6822, partial_loss/deprel_loss: 0.7306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8841, loss: 0.7922, batch_reg_loss: 0.1631, reg_loss: 0.1626 ||:  68%|######8   | 65/95 [00:43<00:20,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8188, UAS: 0.9390, LAS: 0.8860, UEM: 0.5673, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5033, partial_loss/deprel_loss: 1.0465, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3010, loss: 0.7974, batch_reg_loss: 0.1632, reg_loss: 0.1626 ||:  73%|#######2  | 69/95 [00:46<00:17,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9401, LAS: 0.8873, UEM: 0.5793, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2484, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5615, loss: 0.7877, batch_reg_loss: 0.1632, reg_loss: 0.1626 ||:  76%|#######5  | 72/95 [00:48<00:15,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9407, LAS: 0.8878, UEM: 0.5868, LEM: 0.3455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7300, partial_loss/deprel_loss: 0.7953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9455, loss: 0.7839, batch_reg_loss: 0.1633, reg_loss: 0.1627 ||:  79%|#######8  | 75/95 [00:50<00:14,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9402, LAS: 0.8873, UEM: 0.5855, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2602, partial_loss/deprel_loss: 0.4101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.7891, batch_reg_loss: 0.1633, reg_loss: 0.1627 ||:  83%|########3 | 79/95 [00:53<00:10,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9404, LAS: 0.8876, UEM: 0.5859, LEM: 0.3439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2909, partial_loss/deprel_loss: 0.4057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5461, loss: 0.7864, batch_reg_loss: 0.1634, reg_loss: 0.1627 ||:  86%|########6 | 82/95 [00:55<00:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9407, LAS: 0.8877, UEM: 0.5833, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6463, partial_loss/deprel_loss: 0.7100, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8607, loss: 0.7867, batch_reg_loss: 0.1634, reg_loss: 0.1627 ||:  91%|######### | 86/95 [00:57<00:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9406, LAS: 0.8875, UEM: 0.5804, LEM: 0.3326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5472, partial_loss/deprel_loss: 0.6384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7836, loss: 0.7904, batch_reg_loss: 0.1635, reg_loss: 0.1628 ||:  95%|#########4| 90/95 [01:00<00:03,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9395, LAS: 0.8861, UEM: 0.5729, LEM: 0.3268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4341, partial_loss/deprel_loss: 0.5810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7152, loss: 0.8014, batch_reg_loss: 0.1635, reg_loss: 0.1628 ||:  99%|#########8| 94/95 [01:02<00:00,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9398, LAS: 0.8863, UEM: 0.5764, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2508, partial_loss/deprel_loss: 0.4408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5663, loss: 0.7989, batch_reg_loss: 0.1636, reg_loss: 0.1628 ||: 100%|##########| 95/95 [01:03<00:00,  1.51it/s]\n",
+      "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.163  |       N/A\n",
+      "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - UEM                      |     0.576  |       N/A\n",
+      "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - LEM                      |     0.329  |       N/A\n",
+      "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - EM                       |     0.906  |       N/A\n",
+      "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.251  |       N/A\n",
+      "2023-04-06 23:59:25,920 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - UAS                      |     0.940  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.441  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - loss                     |     0.799  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - LAS                      |     0.886  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:59:25,921 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:59:25,922 - INFO - combo.training.trainer - Epoch duration: 0:01:03.115203\n",
+      "2023-04-06 23:59:25,922 - INFO - combo.training.trainer - Estimated training time remaining: 6:20:40\n",
+      "2023-04-06 23:59:25,922 - INFO - allennlp.training.trainer - Epoch 62/399\n",
+      "2023-04-06 23:59:25,922 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-06 23:59:25,922 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:59:25,928 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9352, LAS: 0.8864, UEM: 0.6689, LEM: 0.4856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1004, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4195, loss: 0.8111, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||:   3%|3         | 3/95 [00:02<01:03,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8784, UAS: 0.9423, LAS: 0.8922, UEM: 0.5717, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6524, partial_loss/deprel_loss: 0.7108, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8628, loss: 0.7538, batch_reg_loss: 0.1637, reg_loss: 0.1636 ||:   7%|7         | 7/95 [00:04<00:59,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9436, LAS: 0.8937, UEM: 0.6140, LEM: 0.3753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9611, partial_loss/deprel_loss: 0.8192, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0113, loss: 0.7286, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:  11%|#         | 10/95 [00:06<00:58,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9404, LAS: 0.8906, UEM: 0.5818, LEM: 0.3406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7859, partial_loss/deprel_loss: 0.7698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9368, loss: 0.7612, batch_reg_loss: 0.1638, reg_loss: 0.1637 ||:  15%|#4        | 14/95 [00:09<00:54,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9457, LAS: 0.8979, UEM: 0.6694, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2048, partial_loss/deprel_loss: 0.3795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5084, loss: 0.7118, batch_reg_loss: 0.1638, reg_loss: 0.1637 ||:  18%|#7        | 17/95 [00:11<00:55,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9462, LAS: 0.8974, UEM: 0.6547, LEM: 0.4268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6472, partial_loss/deprel_loss: 0.7830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9197, loss: 0.7198, batch_reg_loss: 0.1639, reg_loss: 0.1637 ||:  21%|##1       | 20/95 [00:13<00:53,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.9451, LAS: 0.8964, UEM: 0.6450, LEM: 0.4199, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9298, partial_loss/deprel_loss: 0.8191, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0052, loss: 0.7245, batch_reg_loss: 0.1639, reg_loss: 0.1638 ||:  24%|##4       | 23/95 [00:16<00:51,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9416, LAS: 0.8921, UEM: 0.6166, LEM: 0.3929, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6848, partial_loss/deprel_loss: 0.7441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8962, loss: 0.7624, batch_reg_loss: 0.1640, reg_loss: 0.1638 ||:  28%|##8       | 27/95 [00:18<00:46,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9440, LAS: 0.8946, UEM: 0.6354, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2743, partial_loss/deprel_loss: 0.4524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5808, loss: 0.7425, batch_reg_loss: 0.1640, reg_loss: 0.1638 ||:  32%|###1      | 30/95 [00:20<00:45,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9422, LAS: 0.8927, UEM: 0.6160, LEM: 0.3835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0462, partial_loss/deprel_loss: 0.8503, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0535, loss: 0.7598, batch_reg_loss: 0.1641, reg_loss: 0.1638 ||:  36%|###5      | 34/95 [00:22<00:40,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9412, LAS: 0.8911, UEM: 0.5973, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6510, partial_loss/deprel_loss: 0.6828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8406, loss: 0.7688, batch_reg_loss: 0.1641, reg_loss: 0.1639 ||:  40%|####      | 38/95 [00:25<00:36,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8747, UAS: 0.9415, LAS: 0.8911, UEM: 0.5952, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8107, partial_loss/deprel_loss: 0.7510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9271, loss: 0.7698, batch_reg_loss: 0.1642, reg_loss: 0.1639 ||:  44%|####4     | 42/95 [00:28<00:34,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9412, LAS: 0.8902, UEM: 0.5865, LEM: 0.3502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0094, partial_loss/deprel_loss: 0.8746, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0658, loss: 0.7748, batch_reg_loss: 0.1642, reg_loss: 0.1639 ||:  48%|####8     | 46/95 [00:30<00:31,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9409, LAS: 0.8899, UEM: 0.5940, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5632, partial_loss/deprel_loss: 0.7819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9025, loss: 0.7776, batch_reg_loss: 0.1643, reg_loss: 0.1640 ||:  53%|#####2    | 50/95 [00:33<00:29,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9404, LAS: 0.8896, UEM: 0.6009, LEM: 0.3688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2029, partial_loss/deprel_loss: 0.3773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5068, loss: 0.7804, batch_reg_loss: 0.1644, reg_loss: 0.1640 ||:  57%|#####6    | 54/95 [00:36<00:27,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9396, LAS: 0.8884, UEM: 0.5930, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5070, partial_loss/deprel_loss: 0.6170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7594, loss: 0.7874, batch_reg_loss: 0.1644, reg_loss: 0.1640 ||:  61%|######1   | 58/95 [00:38<00:24,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9398, LAS: 0.8883, UEM: 0.5847, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5434, partial_loss/deprel_loss: 0.6657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8058, loss: 0.7893, batch_reg_loss: 0.1645, reg_loss: 0.1640 ||:  65%|######5   | 62/95 [00:41<00:22,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9405, LAS: 0.8889, UEM: 0.5865, LEM: 0.3500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3470, partial_loss/deprel_loss: 0.5598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6818, loss: 0.7835, batch_reg_loss: 0.1645, reg_loss: 0.1641 ||:  68%|######8   | 65/95 [00:44<00:21,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9407, LAS: 0.8892, UEM: 0.5836, LEM: 0.3467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3367, partial_loss/deprel_loss: 0.4958, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6286, loss: 0.7819, batch_reg_loss: 0.1646, reg_loss: 0.1641 ||:  72%|#######1  | 68/95 [00:46<00:19,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8300, UAS: 0.9397, LAS: 0.8878, UEM: 0.5751, LEM: 0.3405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3214, partial_loss/deprel_loss: 0.9422, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1827, loss: 0.7904, batch_reg_loss: 0.1646, reg_loss: 0.1641 ||:  75%|#######4  | 71/95 [00:48<00:16,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9409, LAS: 0.8891, UEM: 0.5931, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1709, partial_loss/deprel_loss: 0.3713, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4959, loss: 0.7792, batch_reg_loss: 0.1647, reg_loss: 0.1641 ||:  78%|#######7  | 74/95 [00:50<00:15,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9412, LAS: 0.8893, UEM: 0.5962, LEM: 0.3574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1853, partial_loss/deprel_loss: 0.3972, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5196, loss: 0.7765, batch_reg_loss: 0.1647, reg_loss: 0.1642 ||:  81%|########1 | 77/95 [00:52<00:13,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.9410, LAS: 0.8891, UEM: 0.5931, LEM: 0.3533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0801, partial_loss/deprel_loss: 0.9144, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1123, loss: 0.7780, batch_reg_loss: 0.1648, reg_loss: 0.1642 ||:  84%|########4 | 80/95 [00:54<00:10,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9405, LAS: 0.8886, UEM: 0.5904, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2335, partial_loss/deprel_loss: 0.3604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4999, loss: 0.7813, batch_reg_loss: 0.1648, reg_loss: 0.1642 ||:  88%|########8 | 84/95 [00:57<00:07,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9401, LAS: 0.8881, UEM: 0.5874, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5134, partial_loss/deprel_loss: 0.5706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7241, loss: 0.7856, batch_reg_loss: 0.1649, reg_loss: 0.1642 ||:  93%|#########2| 88/95 [00:59<00:04,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7838, UAS: 0.9391, LAS: 0.8870, UEM: 0.5827, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1079, partial_loss/deprel_loss: 1.1986, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5454, loss: 0.7937, batch_reg_loss: 0.1649, reg_loss: 0.1643 ||:  96%|#########5| 91/95 [01:02<00:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9392, LAS: 0.8870, UEM: 0.5792, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.5187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6370, loss: 0.7949, batch_reg_loss: 0.1650, reg_loss: 0.1643 ||: 100%|##########| 95/95 [01:04<00:00,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9392, LAS: 0.8870, UEM: 0.5792, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.5187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6370, loss: 0.7949, batch_reg_loss: 0.1650, reg_loss: 0.1643 ||: 100%|##########| 95/95 [01:04<00:00,  1.47it/s]\n",
+      "2023-04-07 00:00:30,727 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:00:30,727 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:00:30,727 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.164  |       N/A\n",
+      "2023-04-07 00:00:30,727 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - UEM                      |     0.579  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - LEM                      |     0.338  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - EM                       |     0.907  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.285  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - UAS                      |     0.939  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.519  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - loss                     |     0.795  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - LAS                      |     0.887  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:00:30,728 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:00:30,729 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:00:30,729 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:00:30,729 - INFO - combo.training.trainer - Epoch duration: 0:01:04.807186\n",
+      "2023-04-07 00:00:30,729 - INFO - combo.training.trainer - Estimated training time remaining: 6:19:18\n",
+      "2023-04-07 00:00:30,729 - INFO - allennlp.training.trainer - Epoch 63/399\n",
+      "2023-04-07 00:00:30,729 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:00:30,730 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:00:30,735 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9214, LAS: 0.8709, UEM: 0.3921, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3276, partial_loss/deprel_loss: 0.5189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6457, loss: 0.9274, batch_reg_loss: 0.1651, reg_loss: 0.1651 ||:   4%|4         | 4/95 [00:02<01:01,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8297, UAS: 0.9183, LAS: 0.8660, UEM: 0.3468, LEM: 0.1579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3947, partial_loss/deprel_loss: 0.8886, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1549, loss: 0.9582, batch_reg_loss: 0.1651, reg_loss: 0.1651 ||:   7%|7         | 7/95 [00:04<00:59,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9267, LAS: 0.8754, UEM: 0.4078, LEM: 0.2043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6982, partial_loss/deprel_loss: 0.7160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8776, loss: 0.8958, batch_reg_loss: 0.1652, reg_loss: 0.1651 ||:  12%|#1        | 11/95 [00:06<00:52,  1.60it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8539, UAS: 0.9305, LAS: 0.8789, UEM: 0.4726, LEM: 0.2452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0189, partial_loss/deprel_loss: 0.8535, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0519, loss: 0.8685, batch_reg_loss: 0.1653, reg_loss: 0.1652 ||:  16%|#5        | 15/95 [00:09<00:49,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9332, LAS: 0.8818, UEM: 0.4824, LEM: 0.2443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5805, partial_loss/deprel_loss: 0.7069, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8470, loss: 0.8474, batch_reg_loss: 0.1653, reg_loss: 0.1652 ||:  19%|#8        | 18/95 [00:11<00:48,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8868, UAS: 0.9346, LAS: 0.8828, UEM: 0.4713, LEM: 0.2292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4694, partial_loss/deprel_loss: 0.6779, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8016, loss: 0.8447, batch_reg_loss: 0.1654, reg_loss: 0.1652 ||:  22%|##2       | 21/95 [00:13<00:48,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9343, LAS: 0.8826, UEM: 0.4678, LEM: 0.2258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2384, partial_loss/deprel_loss: 0.4394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5646, loss: 0.8508, batch_reg_loss: 0.1655, reg_loss: 0.1652 ||:  26%|##6       | 25/95 [00:15<00:45,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9365, LAS: 0.8847, UEM: 0.5053, LEM: 0.2608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6228, partial_loss/deprel_loss: 0.7041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8533, loss: 0.8323, batch_reg_loss: 0.1655, reg_loss: 0.1653 ||:  31%|###       | 29/95 [00:18<00:43,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9382, LAS: 0.8863, UEM: 0.5066, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4859, partial_loss/deprel_loss: 0.6017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7441, loss: 0.8173, batch_reg_loss: 0.1656, reg_loss: 0.1653 ||:  35%|###4      | 33/95 [00:21<00:40,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9401, LAS: 0.8883, UEM: 0.5258, LEM: 0.2682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4612, partial_loss/deprel_loss: 0.5999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7378, loss: 0.8021, batch_reg_loss: 0.1656, reg_loss: 0.1653 ||:  38%|###7      | 36/95 [00:23<00:41,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9416, LAS: 0.8898, UEM: 0.5378, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3752, partial_loss/deprel_loss: 0.4718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6181, loss: 0.7879, batch_reg_loss: 0.1656, reg_loss: 0.1654 ||:  41%|####1     | 39/95 [00:25<00:38,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9415, LAS: 0.8892, UEM: 0.5376, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2148, partial_loss/deprel_loss: 0.4684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5834, loss: 0.7905, batch_reg_loss: 0.1657, reg_loss: 0.1654 ||:  45%|####5     | 43/95 [00:27<00:34,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9408, LAS: 0.8884, UEM: 0.5277, LEM: 0.2620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7331, partial_loss/deprel_loss: 0.7146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8840, loss: 0.7976, batch_reg_loss: 0.1657, reg_loss: 0.1654 ||:  48%|####8     | 46/95 [00:29<00:32,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9573, UAS: 0.9413, LAS: 0.8890, UEM: 0.5571, LEM: 0.3055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0420, partial_loss/deprel_loss: 0.1709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3109, loss: 0.7932, batch_reg_loss: 0.1658, reg_loss: 0.1654 ||:  53%|#####2    | 50/95 [00:33<00:31,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9382, LAS: 0.8855, UEM: 0.5419, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8462, partial_loss/deprel_loss: 0.8174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9890, loss: 0.8220, batch_reg_loss: 0.1658, reg_loss: 0.1655 ||:  57%|#####6    | 54/95 [00:35<00:28,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8002, UAS: 0.9376, LAS: 0.8850, UEM: 0.5406, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9688, partial_loss/deprel_loss: 1.1840, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5069, loss: 0.8260, batch_reg_loss: 0.1659, reg_loss: 0.1655 ||:  61%|######1   | 58/95 [00:38<00:24,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9384, LAS: 0.8859, UEM: 0.5466, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1713, partial_loss/deprel_loss: 0.3812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5051, loss: 0.8189, batch_reg_loss: 0.1659, reg_loss: 0.1655 ||:  64%|######4   | 61/95 [00:40<00:23,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9396, LAS: 0.8873, UEM: 0.5644, LEM: 0.3140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2480, partial_loss/deprel_loss: 0.4449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5715, loss: 0.8056, batch_reg_loss: 0.1660, reg_loss: 0.1655 ||:  67%|######7   | 64/95 [00:42<00:21,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9396, LAS: 0.8872, UEM: 0.5700, LEM: 0.3215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1402, partial_loss/deprel_loss: 0.3569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4796, loss: 0.8043, batch_reg_loss: 0.1660, reg_loss: 0.1656 ||:  71%|#######   | 67/95 [00:44<00:19,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9395, LAS: 0.8872, UEM: 0.5704, LEM: 0.3235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3419, partial_loss/deprel_loss: 0.5650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6865, loss: 0.8056, batch_reg_loss: 0.1661, reg_loss: 0.1656 ||:  75%|#######4  | 71/95 [00:47<00:16,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9397, LAS: 0.8872, UEM: 0.5716, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5127, partial_loss/deprel_loss: 0.6654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8010, loss: 0.8049, batch_reg_loss: 0.1661, reg_loss: 0.1656 ||:  78%|#######7  | 74/95 [00:49<00:15,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9397, LAS: 0.8872, UEM: 0.5663, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5178, partial_loss/deprel_loss: 0.6335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7766, loss: 0.8046, batch_reg_loss: 0.1662, reg_loss: 0.1656 ||:  81%|########1 | 77/95 [00:51<00:12,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9391, LAS: 0.8865, UEM: 0.5645, LEM: 0.3182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3299, partial_loss/deprel_loss: 0.9747, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2120, loss: 0.8106, batch_reg_loss: 0.1662, reg_loss: 0.1657 ||:  84%|########4 | 80/95 [00:54<00:10,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9400, LAS: 0.8874, UEM: 0.5756, LEM: 0.3282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2448, partial_loss/deprel_loss: 0.5046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6189, loss: 0.8024, batch_reg_loss: 0.1663, reg_loss: 0.1657 ||:  87%|########7 | 83/95 [00:56<00:08,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9407, LAS: 0.8882, UEM: 0.5854, LEM: 0.3402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3117, partial_loss/deprel_loss: 0.4566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5940, loss: 0.7962, batch_reg_loss: 0.1663, reg_loss: 0.1657 ||:  91%|######### | 86/95 [00:58<00:06,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9402, LAS: 0.8877, UEM: 0.5813, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9233, partial_loss/deprel_loss: 0.7878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9813, loss: 0.8002, batch_reg_loss: 0.1664, reg_loss: 0.1657 ||:  94%|#########3| 89/95 [01:00<00:04,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8439, UAS: 0.9401, LAS: 0.8875, UEM: 0.5781, LEM: 0.3345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9979, partial_loss/deprel_loss: 0.9188, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1010, loss: 0.8021, batch_reg_loss: 0.1664, reg_loss: 0.1657 ||:  97%|#########6| 92/95 [01:02<00:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8508, UAS: 0.9401, LAS: 0.8876, UEM: 0.5794, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1858, partial_loss/deprel_loss: 0.9170, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1372, loss: 0.8015, batch_reg_loss: 0.1665, reg_loss: 0.1658 ||: 100%|##########| 95/95 [01:04<00:00,  1.47it/s]\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.166  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - UEM                      |     0.579  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - LEM                      |     0.335  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - EM                       |     0.851  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.186  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - UAS                      |     0.940  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.917  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - loss                     |     0.801  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:01:35,408 - INFO - combo.training.tensorboard_writer - LAS                      |     0.888  |       N/A\n",
+      "2023-04-07 00:01:35,409 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:01:35,409 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:01:35,409 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:01:35,409 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:01:35,409 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:01:35,409 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:01:35,409 - INFO - combo.training.trainer - Epoch duration: 0:01:04.680005\n",
+      "2023-04-07 00:01:35,409 - INFO - combo.training.trainer - Estimated training time remaining: 6:17:55\n",
+      "2023-04-07 00:01:35,409 - INFO - allennlp.training.trainer - Epoch 64/399\n",
+      "2023-04-07 00:01:35,410 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:01:35,410 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:01:35,416 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9472, LAS: 0.9002, UEM: 0.5593, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.3970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5317, loss: 0.7240, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||:   4%|4         | 4/95 [00:02<00:59,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8633, UAS: 0.9445, LAS: 0.8949, UEM: 0.5081, LEM: 0.2425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8786, partial_loss/deprel_loss: 0.8800, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0463, loss: 0.7558, batch_reg_loss: 0.1666, reg_loss: 0.1665 ||:   8%|8         | 8/95 [00:04<00:54,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9423, LAS: 0.8919, UEM: 0.4719, LEM: 0.2172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7350, partial_loss/deprel_loss: 0.6780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8560, loss: 0.7743, batch_reg_loss: 0.1666, reg_loss: 0.1666 ||:  13%|#2        | 12/95 [00:07<00:52,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9363, LAS: 0.8857, UEM: 0.5424, LEM: 0.3153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8850, partial_loss/deprel_loss: 0.7542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9470, loss: 0.8111, batch_reg_loss: 0.1667, reg_loss: 0.1666 ||:  16%|#5        | 15/95 [00:09<00:54,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.9363, LAS: 0.8849, UEM: 0.5609, LEM: 0.3296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3685, partial_loss/deprel_loss: 0.9459, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1972, loss: 0.8203, batch_reg_loss: 0.1667, reg_loss: 0.1666 ||:  20%|##        | 19/95 [00:12<00:50,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9379, LAS: 0.8866, UEM: 0.5555, LEM: 0.3195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7078, partial_loss/deprel_loss: 0.6756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8488, loss: 0.8055, batch_reg_loss: 0.1668, reg_loss: 0.1666 ||:  24%|##4       | 23/95 [00:14<00:46,  1.55it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9390, LAS: 0.8881, UEM: 0.5410, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3953, partial_loss/deprel_loss: 0.4859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6347, loss: 0.7956, batch_reg_loss: 0.1669, reg_loss: 0.1667 ||:  28%|##8       | 27/95 [00:17<00:42,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9401, LAS: 0.8887, UEM: 0.5347, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5704, partial_loss/deprel_loss: 0.6689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8162, loss: 0.7944, batch_reg_loss: 0.1669, reg_loss: 0.1667 ||:  33%|###2      | 31/95 [00:19<00:38,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9017, UAS: 0.9404, LAS: 0.8885, UEM: 0.5455, LEM: 0.2973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4811, partial_loss/deprel_loss: 0.5935, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7380, loss: 0.7950, batch_reg_loss: 0.1670, reg_loss: 0.1667 ||:  37%|###6      | 35/95 [00:21<00:37,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9410, LAS: 0.8897, UEM: 0.5818, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3507, partial_loss/deprel_loss: 0.5233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6558, loss: 0.7895, batch_reg_loss: 0.1671, reg_loss: 0.1668 ||:  41%|####1     | 39/95 [00:25<00:39,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9068, UAS: 0.9411, LAS: 0.8898, UEM: 0.5699, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4048, partial_loss/deprel_loss: 0.5478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6863, loss: 0.7894, batch_reg_loss: 0.1671, reg_loss: 0.1668 ||:  44%|####4     | 42/95 [00:28<00:39,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8088, UAS: 0.9403, LAS: 0.8891, UEM: 0.5757, LEM: 0.3450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6599, partial_loss/deprel_loss: 1.0256, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3196, loss: 0.7933, batch_reg_loss: 0.1671, reg_loss: 0.1668 ||:  47%|####7     | 45/95 [00:30<00:38,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9398, LAS: 0.8885, UEM: 0.5682, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3592, partial_loss/deprel_loss: 0.5030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6414, loss: 0.7956, batch_reg_loss: 0.1672, reg_loss: 0.1668 ||:  52%|#####1    | 49/95 [00:33<00:35,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9409, LAS: 0.8897, UEM: 0.5873, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2698, partial_loss/deprel_loss: 0.4250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5612, loss: 0.7860, batch_reg_loss: 0.1672, reg_loss: 0.1669 ||:  55%|#####4    | 52/95 [00:35<00:32,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9411, LAS: 0.8898, UEM: 0.5823, LEM: 0.3476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6031, partial_loss/deprel_loss: 0.7107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8565, loss: 0.7849, batch_reg_loss: 0.1673, reg_loss: 0.1669 ||:  59%|#####8    | 56/95 [00:38<00:27,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9406, LAS: 0.8893, UEM: 0.5731, LEM: 0.3389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.5425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6728, loss: 0.7874, batch_reg_loss: 0.1674, reg_loss: 0.1669 ||:  63%|######3   | 60/95 [00:40<00:23,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9410, LAS: 0.8894, UEM: 0.5753, LEM: 0.3377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5480, partial_loss/deprel_loss: 0.6567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8024, loss: 0.7839, batch_reg_loss: 0.1674, reg_loss: 0.1670 ||:  67%|######7   | 64/95 [00:43<00:20,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9406, LAS: 0.8890, UEM: 0.5698, LEM: 0.3337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2822, partial_loss/deprel_loss: 0.4641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5952, loss: 0.7861, batch_reg_loss: 0.1675, reg_loss: 0.1670 ||:  72%|#######1  | 68/95 [00:46<00:18,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9412, LAS: 0.8896, UEM: 0.5707, LEM: 0.3303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5073, partial_loss/deprel_loss: 0.7481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8675, loss: 0.7817, batch_reg_loss: 0.1675, reg_loss: 0.1670 ||:  76%|#######5  | 72/95 [00:48<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8362, UAS: 0.9407, LAS: 0.8891, UEM: 0.5695, LEM: 0.3305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3392, partial_loss/deprel_loss: 1.0263, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2565, loss: 0.7844, batch_reg_loss: 0.1676, reg_loss: 0.1670 ||:  79%|#######8  | 75/95 [00:50<00:13,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9401, LAS: 0.8884, UEM: 0.5636, LEM: 0.3251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4045, partial_loss/deprel_loss: 0.5355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6769, loss: 0.7911, batch_reg_loss: 0.1676, reg_loss: 0.1671 ||:  82%|########2 | 78/95 [00:53<00:12,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9406, LAS: 0.8891, UEM: 0.5730, LEM: 0.3334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1452, partial_loss/deprel_loss: 0.3148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4486, loss: 0.7860, batch_reg_loss: 0.1677, reg_loss: 0.1671 ||:  86%|########6 | 82/95 [00:55<00:09,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9412, LAS: 0.8897, UEM: 0.5791, LEM: 0.3361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1987, partial_loss/deprel_loss: 0.3826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5135, loss: 0.7819, batch_reg_loss: 0.1677, reg_loss: 0.1671 ||:  89%|########9 | 85/95 [00:58<00:07,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9409, LAS: 0.8892, UEM: 0.5757, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4878, partial_loss/deprel_loss: 0.6423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7792, loss: 0.7858, batch_reg_loss: 0.1678, reg_loss: 0.1671 ||:  93%|#########2| 88/95 [01:00<00:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8304, UAS: 0.9403, LAS: 0.8885, UEM: 0.5799, LEM: 0.3381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3140, partial_loss/deprel_loss: 1.0576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2767, loss: 0.7918, batch_reg_loss: 0.1678, reg_loss: 0.1672 ||:  96%|#########5| 91/95 [01:02<00:02,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9396, LAS: 0.8877, UEM: 0.5755, LEM: 0.3341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4699, partial_loss/deprel_loss: 0.6063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7469, loss: 0.7974, batch_reg_loss: 0.1679, reg_loss: 0.1672 ||:  99%|#########8| 94/95 [01:04<00:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9399, LAS: 0.8881, UEM: 0.5787, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2153, partial_loss/deprel_loss: 0.3856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5194, loss: 0.7945, batch_reg_loss: 0.1679, reg_loss: 0.1672 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n",
+      "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.167  |       N/A\n",
+      "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - UEM                      |     0.579  |       N/A\n",
+      "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - LEM                      |     0.337  |       N/A\n",
+      "2023-04-07 00:02:40,496 - INFO - combo.training.tensorboard_writer - EM                       |     0.919  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.215  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - UAS                      |     0.940  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.386  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - loss                     |     0.795  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - LAS                      |     0.888  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:02:40,497 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:02:40,498 - INFO - combo.training.trainer - Epoch duration: 0:01:05.088427\n",
+      "2023-04-07 00:02:40,498 - INFO - combo.training.trainer - Estimated training time remaining: 6:16:36\n",
+      "2023-04-07 00:02:40,498 - INFO - allennlp.training.trainer - Epoch 65/399\n",
+      "2023-04-07 00:02:40,498 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:02:40,499 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:02:40,505 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9564, LAS: 0.9078, UEM: 0.6076, LEM: 0.3064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4727, partial_loss/deprel_loss: 0.5492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7018, loss: 0.6344, batch_reg_loss: 0.1679, reg_loss: 0.1679 ||:   3%|3         | 3/95 [00:02<01:13,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9593, LAS: 0.9088, UEM: 0.6460, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2772, partial_loss/deprel_loss: 0.5124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6333, loss: 0.6441, batch_reg_loss: 0.1680, reg_loss: 0.1679 ||:   6%|6         | 6/95 [00:04<01:09,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9529, LAS: 0.9027, UEM: 0.6704, LEM: 0.4140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1125, partial_loss/deprel_loss: 0.2377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3806, loss: 0.6866, batch_reg_loss: 0.1680, reg_loss: 0.1680 ||:   9%|9         | 9/95 [00:06<01:04,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8815, UAS: 0.9511, LAS: 0.9012, UEM: 0.6389, LEM: 0.3824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7581, partial_loss/deprel_loss: 0.6781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8622, loss: 0.6975, batch_reg_loss: 0.1681, reg_loss: 0.1680 ||:  13%|#2        | 12/95 [00:08<01:00,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9522, LAS: 0.9026, UEM: 0.6560, LEM: 0.4041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4369, partial_loss/deprel_loss: 0.6236, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7544, loss: 0.6851, batch_reg_loss: 0.1681, reg_loss: 0.1680 ||:  16%|#5        | 15/95 [00:10<00:58,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9511, LAS: 0.9019, UEM: 0.6863, LEM: 0.4643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8530, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9697, loss: 0.6922, batch_reg_loss: 0.1682, reg_loss: 0.1680 ||:  19%|#8        | 18/95 [00:13<00:56,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9495, LAS: 0.8995, UEM: 0.6710, LEM: 0.4392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3663, partial_loss/deprel_loss: 0.5152, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6536, loss: 0.7071, batch_reg_loss: 0.1682, reg_loss: 0.1681 ||:  23%|##3       | 22/95 [00:15<00:51,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9493, LAS: 0.8991, UEM: 0.6559, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2240, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5617, loss: 0.7120, batch_reg_loss: 0.1683, reg_loss: 0.1681 ||:  26%|##6       | 25/95 [00:17<00:50,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9492, LAS: 0.8993, UEM: 0.6571, LEM: 0.4210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2532, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5650, loss: 0.7124, batch_reg_loss: 0.1683, reg_loss: 0.1681 ||:  29%|##9       | 28/95 [00:19<00:47,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8608, UAS: 0.9469, LAS: 0.8965, UEM: 0.6418, LEM: 0.4084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9097, partial_loss/deprel_loss: 0.8116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9995, loss: 0.7314, batch_reg_loss: 0.1683, reg_loss: 0.1681 ||:  34%|###3      | 32/95 [00:22<00:42,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9467, LAS: 0.8962, UEM: 0.6360, LEM: 0.4018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7673, partial_loss/deprel_loss: 0.7183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8965, loss: 0.7326, batch_reg_loss: 0.1684, reg_loss: 0.1682 ||:  38%|###7      | 36/95 [00:24<00:38,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9472, LAS: 0.8970, UEM: 0.6440, LEM: 0.4078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2836, partial_loss/deprel_loss: 0.4544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5887, loss: 0.7272, batch_reg_loss: 0.1684, reg_loss: 0.1682 ||:  42%|####2     | 40/95 [00:27<00:35,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9445, LAS: 0.8937, UEM: 0.6242, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5100, partial_loss/deprel_loss: 0.6251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7706, loss: 0.7519, batch_reg_loss: 0.1685, reg_loss: 0.1682 ||:  46%|####6     | 44/95 [00:29<00:31,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8805, UAS: 0.9451, LAS: 0.8943, UEM: 0.6272, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6013, partial_loss/deprel_loss: 0.6473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8067, loss: 0.7459, batch_reg_loss: 0.1685, reg_loss: 0.1682 ||:  51%|#####     | 48/95 [00:32<00:29,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9457, LAS: 0.8946, UEM: 0.6246, LEM: 0.3849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2902, partial_loss/deprel_loss: 0.4431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5811, loss: 0.7445, batch_reg_loss: 0.1686, reg_loss: 0.1683 ||:  55%|#####4    | 52/95 [00:35<00:28,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9447, LAS: 0.8932, UEM: 0.6123, LEM: 0.3733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7916, partial_loss/deprel_loss: 0.8026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9691, loss: 0.7550, batch_reg_loss: 0.1687, reg_loss: 0.1683 ||:  59%|#####8    | 56/95 [00:37<00:25,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8389, UAS: 0.9437, LAS: 0.8923, UEM: 0.6005, LEM: 0.3630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2806, partial_loss/deprel_loss: 0.9364, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1740, loss: 0.7627, batch_reg_loss: 0.1687, reg_loss: 0.1683 ||:  63%|######3   | 60/95 [00:39<00:21,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8578, UAS: 0.9435, LAS: 0.8919, UEM: 0.5947, LEM: 0.3544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9394, partial_loss/deprel_loss: 0.8132, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0072, loss: 0.7646, batch_reg_loss: 0.1688, reg_loss: 0.1683 ||:  67%|######7   | 64/95 [00:42<00:19,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9428, LAS: 0.8911, UEM: 0.5987, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2543, partial_loss/deprel_loss: 0.4429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5740, loss: 0.7699, batch_reg_loss: 0.1688, reg_loss: 0.1684 ||:  72%|#######1  | 68/95 [00:45<00:17,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9426, LAS: 0.8908, UEM: 0.5985, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2651, partial_loss/deprel_loss: 0.3904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5343, loss: 0.7715, batch_reg_loss: 0.1689, reg_loss: 0.1684 ||:  76%|#######5  | 72/95 [00:48<00:15,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9427, LAS: 0.8907, UEM: 0.5906, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3585, partial_loss/deprel_loss: 0.5088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6477, loss: 0.7718, batch_reg_loss: 0.1690, reg_loss: 0.1684 ||:  80%|########  | 76/95 [00:50<00:12,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8380, UAS: 0.9404, LAS: 0.8882, UEM: 0.5791, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3009, partial_loss/deprel_loss: 0.8551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1133, loss: 0.7898, batch_reg_loss: 0.1690, reg_loss: 0.1685 ||:  84%|########4 | 80/95 [00:53<00:09,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8098, UAS: 0.9381, LAS: 0.8858, UEM: 0.5699, LEM: 0.3332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6742, partial_loss/deprel_loss: 1.0952, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3801, loss: 0.8083, batch_reg_loss: 0.1691, reg_loss: 0.1685 ||:  88%|########8 | 84/95 [00:55<00:07,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9385, LAS: 0.8863, UEM: 0.5736, LEM: 0.3352, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5025, partial_loss/deprel_loss: 0.5241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6890, loss: 0.8038, batch_reg_loss: 0.1692, reg_loss: 0.1685 ||:  93%|#########2| 88/95 [00:58<00:04,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9391, LAS: 0.8868, UEM: 0.5768, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3505, partial_loss/deprel_loss: 0.5389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6704, loss: 0.7998, batch_reg_loss: 0.1693, reg_loss: 0.1685 ||:  97%|#########6| 92/95 [01:00<00:01,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9387, LAS: 0.8862, UEM: 0.5743, LEM: 0.3335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4254, partial_loss/deprel_loss: 0.6097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7421, loss: 0.8043, batch_reg_loss: 0.1693, reg_loss: 0.1686 ||: 100%|##########| 95/95 [01:02<00:00,  1.51it/s]\n",
+      "2023-04-07 00:03:43,247 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9431, LAS: 0.8916, UEM: 0.5405, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3246, partial_loss/deprel_loss: 28.2893, partial_loss/cycle_loss: 0.0000, batch_loss: 22.6963, loss: 28.5523, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:07,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8423, UAS: 0.9353, LAS: 0.8808, UEM: 0.4659, LEM: 0.2253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4638, partial_loss/deprel_loss: 57.8192, partial_loss/cycle_loss: 0.0000, batch_loss: 46.5482, loss: 31.9561, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:05,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8985, UAS: 0.9451, LAS: 0.8888, UEM: 0.5769, LEM: 0.2588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5146, partial_loss/deprel_loss: 24.2149, partial_loss/cycle_loss: 0.0000, batch_loss: 19.4748, loss: 27.8085, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:07<00:02,  1.07it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9462, LAS: 0.8915, UEM: 0.6454, LEM: 0.3727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9144, partial_loss/deprel_loss: 44.4241, partial_loss/cycle_loss: 0.0000, batch_loss: 35.7222, loss: 27.4137, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:09<00:00,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9485, LAS: 0.8950, UEM: 0.6749, LEM: 0.4002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2146, partial_loss/deprel_loss: 22.9214, partial_loss/cycle_loss: 0.0000, batch_loss: 18.3801, loss: 26.5925, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.01it/s]\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.169  |     0.000\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - UEM                      |     0.574  |     0.675\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - LEM                      |     0.334  |     0.400\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - EM                       |     0.896  |     0.929\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.425  |     0.215\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:03:54,100 - INFO - combo.training.tensorboard_writer - UAS                      |     0.939  |     0.948\n",
+      "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.610  |    22.921\n",
+      "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - loss                     |     0.804  |    26.592\n",
+      "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - LAS                      |     0.886  |     0.895\n",
+      "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:03:54,101 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:03:54,102 - INFO - combo.training.trainer - Epoch duration: 0:01:13.603661\n",
+      "2023-04-07 00:03:54,102 - INFO - combo.training.trainer - Estimated training time remaining: 6:15:59\n",
+      "2023-04-07 00:03:54,102 - INFO - allennlp.training.trainer - Epoch 66/399\n",
+      "2023-04-07 00:03:54,102 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:03:54,103 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:03:54,110 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9601, LAS: 0.9097, UEM: 0.7095, LEM: 0.4156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3314, partial_loss/deprel_loss: 0.5307, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6602, loss: 0.6498, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||:   4%|4         | 4/95 [00:02<00:54,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9595, LAS: 0.9089, UEM: 0.7318, LEM: 0.4507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5926, partial_loss/deprel_loss: 0.6805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8324, loss: 0.6449, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||:   7%|7         | 7/95 [00:04<00:55,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9554, LAS: 0.9035, UEM: 0.6783, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2470, partial_loss/deprel_loss: 0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5369, loss: 0.6774, batch_reg_loss: 0.1695, reg_loss: 0.1694 ||:  12%|#1        | 11/95 [00:06<00:51,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8499, UAS: 0.9473, LAS: 0.8944, UEM: 0.6155, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9505, partial_loss/deprel_loss: 0.9103, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0879, loss: 0.7509, batch_reg_loss: 0.1695, reg_loss: 0.1694 ||:  16%|#5        | 15/95 [00:09<00:49,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9481, LAS: 0.8951, UEM: 0.6158, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5815, partial_loss/deprel_loss: 0.6274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7879, loss: 0.7384, batch_reg_loss: 0.1696, reg_loss: 0.1695 ||:  19%|#8        | 18/95 [00:11<00:49,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9467, LAS: 0.8940, UEM: 0.6187, LEM: 0.3435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1853, partial_loss/deprel_loss: 0.9649, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1786, loss: 0.7459, batch_reg_loss: 0.1696, reg_loss: 0.1695 ||:  22%|##2       | 21/95 [00:13<00:48,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9427, LAS: 0.8898, UEM: 0.6051, LEM: 0.3304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4605, partial_loss/deprel_loss: 0.6038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7448, loss: 0.7777, batch_reg_loss: 0.1697, reg_loss: 0.1695 ||:  25%|##5       | 24/95 [00:15<00:46,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8805, UAS: 0.9414, LAS: 0.8885, UEM: 0.5777, LEM: 0.3091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6379, partial_loss/deprel_loss: 0.6606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8258, loss: 0.7842, batch_reg_loss: 0.1697, reg_loss: 0.1695 ||:  29%|##9       | 28/95 [00:18<00:43,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9420, LAS: 0.8890, UEM: 0.5812, LEM: 0.3157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1397, partial_loss/deprel_loss: 0.3224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4556, loss: 0.7807, batch_reg_loss: 0.1698, reg_loss: 0.1696 ||:  33%|###2      | 31/95 [00:20<00:43,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8744, UAS: 0.9431, LAS: 0.8901, UEM: 0.5918, LEM: 0.3229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5835, partial_loss/deprel_loss: 0.7340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8737, loss: 0.7734, batch_reg_loss: 0.1698, reg_loss: 0.1696 ||:  36%|###5      | 34/95 [00:22<00:43,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9435, LAS: 0.8908, UEM: 0.5906, LEM: 0.3209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7973, partial_loss/deprel_loss: 0.7353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9176, loss: 0.7715, batch_reg_loss: 0.1699, reg_loss: 0.1696 ||:  39%|###8      | 37/95 [00:24<00:41,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9435, LAS: 0.8912, UEM: 0.6163, LEM: 0.3643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1037, partial_loss/deprel_loss: 0.9039, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1138, loss: 0.7703, batch_reg_loss: 0.1699, reg_loss: 0.1696 ||:  42%|####2     | 40/95 [00:27<00:41,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9444, LAS: 0.8924, UEM: 0.6293, LEM: 0.3798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1451, partial_loss/deprel_loss: 0.2613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4081, loss: 0.7592, batch_reg_loss: 0.1700, reg_loss: 0.1697 ||:  46%|####6     | 44/95 [00:30<00:37,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9447, LAS: 0.8929, UEM: 0.6220, LEM: 0.3716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4300, partial_loss/deprel_loss: 0.5710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7128, loss: 0.7575, batch_reg_loss: 0.1700, reg_loss: 0.1697 ||:  49%|####9     | 47/95 [00:32<00:36,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9456, LAS: 0.8939, UEM: 0.6293, LEM: 0.3772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4173, partial_loss/deprel_loss: 0.5274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6754, loss: 0.7488, batch_reg_loss: 0.1701, reg_loss: 0.1697 ||:  53%|#####2    | 50/95 [00:34<00:34,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9451, LAS: 0.8935, UEM: 0.6279, LEM: 0.3774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2563, partial_loss/deprel_loss: 0.4042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.7522, batch_reg_loss: 0.1701, reg_loss: 0.1697 ||:  56%|#####5    | 53/95 [00:37<00:32,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9448, LAS: 0.8931, UEM: 0.6190, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3614, partial_loss/deprel_loss: 0.5620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6920, loss: 0.7568, batch_reg_loss: 0.1701, reg_loss: 0.1698 ||:  60%|######    | 57/95 [00:39<00:28,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9442, LAS: 0.8929, UEM: 0.6134, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2584, partial_loss/deprel_loss: 0.3723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5197, loss: 0.7584, batch_reg_loss: 0.1702, reg_loss: 0.1698 ||:  64%|######4   | 61/95 [00:42<00:24,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9437, LAS: 0.8924, UEM: 0.6152, LEM: 0.3693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0340, partial_loss/deprel_loss: 0.9069, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1026, loss: 0.7631, batch_reg_loss: 0.1702, reg_loss: 0.1698 ||:  67%|######7   | 64/95 [00:44<00:22,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9426, LAS: 0.8911, UEM: 0.6056, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6441, partial_loss/deprel_loss: 0.7303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8833, loss: 0.7733, batch_reg_loss: 0.1703, reg_loss: 0.1698 ||:  71%|#######   | 67/95 [00:47<00:20,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9427, LAS: 0.8911, UEM: 0.6021, LEM: 0.3584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2508, partial_loss/deprel_loss: 0.4391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5718, loss: 0.7728, batch_reg_loss: 0.1703, reg_loss: 0.1698 ||:  74%|#######3  | 70/95 [00:49<00:18,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9406, LAS: 0.8890, UEM: 0.5930, LEM: 0.3511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8441, partial_loss/deprel_loss: 0.7311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9241, loss: 0.7889, batch_reg_loss: 0.1704, reg_loss: 0.1699 ||:  78%|#######7  | 74/95 [00:51<00:14,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9407, LAS: 0.8890, UEM: 0.5944, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3029, partial_loss/deprel_loss: 0.4895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6226, loss: 0.7878, batch_reg_loss: 0.1704, reg_loss: 0.1699 ||:  81%|########1 | 77/95 [00:53<00:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9409, LAS: 0.8890, UEM: 0.5910, LEM: 0.3453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4703, partial_loss/deprel_loss: 0.5552, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7087, loss: 0.7876, batch_reg_loss: 0.1705, reg_loss: 0.1699 ||:  84%|########4 | 80/95 [00:55<00:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8330, UAS: 0.9403, LAS: 0.8882, UEM: 0.5875, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2940, partial_loss/deprel_loss: 0.9074, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1553, loss: 0.7936, batch_reg_loss: 0.1706, reg_loss: 0.1699 ||:  88%|########8 | 84/95 [00:58<00:07,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9388, LAS: 0.8866, UEM: 0.5830, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.4753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6039, loss: 0.8044, batch_reg_loss: 0.1706, reg_loss: 0.1700 ||:  93%|#########2| 88/95 [01:01<00:04,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9390, LAS: 0.8868, UEM: 0.5818, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3476, partial_loss/deprel_loss: 0.4743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6197, loss: 0.8040, batch_reg_loss: 0.1707, reg_loss: 0.1700 ||:  96%|#########5| 91/95 [01:03<00:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9398, LAS: 0.8876, UEM: 0.5812, LEM: 0.3343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4487, partial_loss/deprel_loss: 0.5758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7212, loss: 0.7984, batch_reg_loss: 0.1708, reg_loss: 0.1700 ||: 100%|##########| 95/95 [01:05<00:00,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9398, LAS: 0.8876, UEM: 0.5812, LEM: 0.3343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4487, partial_loss/deprel_loss: 0.5758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7212, loss: 0.7984, batch_reg_loss: 0.1708, reg_loss: 0.1700 ||: 100%|##########| 95/95 [01:05<00:00,  1.44it/s]\n",
+      "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.170  |       N/A\n",
+      "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - UEM                      |     0.581  |       N/A\n",
+      "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - LEM                      |     0.334  |       N/A\n",
+      "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - EM                       |     0.899  |       N/A\n",
+      "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.449  |       N/A\n",
+      "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:05:00,015 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - UAS                      |     0.940  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.576  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - loss                     |     0.798  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - LAS                      |     0.888  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:05:00,016 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:05:00,017 - INFO - combo.training.trainer - Epoch duration: 0:01:05.914712\n",
+      "2023-04-07 00:05:00,017 - INFO - combo.training.trainer - Estimated training time remaining: 6:14:44\n",
+      "2023-04-07 00:05:00,017 - INFO - allennlp.training.trainer - Epoch 67/399\n",
+      "2023-04-07 00:05:00,017 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:05:00,017 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:05:00,024 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8743, UAS: 0.9324, LAS: 0.8811, UEM: 0.5772, LEM: 0.3801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7538, partial_loss/deprel_loss: 0.7196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8973, loss: 0.8357, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:   3%|3         | 3/95 [00:02<01:03,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9336, LAS: 0.8826, UEM: 0.6490, LEM: 0.4709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1526, partial_loss/deprel_loss: 0.2426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3954, loss: 0.8197, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:   6%|6         | 6/95 [00:04<01:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9230, LAS: 0.8695, UEM: 0.5531, LEM: 0.3804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5493, partial_loss/deprel_loss: 0.6046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7644, loss: 0.9168, batch_reg_loss: 0.1709, reg_loss: 0.1708 ||:  11%|#         | 10/95 [00:06<00:58,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9311, LAS: 0.8784, UEM: 0.5744, LEM: 0.3594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.5015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6380, loss: 0.8554, batch_reg_loss: 0.1710, reg_loss: 0.1709 ||:  14%|#3        | 13/95 [00:09<00:57,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9310, LAS: 0.8779, UEM: 0.5689, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2638, partial_loss/deprel_loss: 0.4523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5856, loss: 0.8573, batch_reg_loss: 0.1710, reg_loss: 0.1709 ||:  17%|#6        | 16/95 [00:11<00:57,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9345, LAS: 0.8821, UEM: 0.5764, LEM: 0.3462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2498, partial_loss/deprel_loss: 0.3415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4943, loss: 0.8235, batch_reg_loss: 0.1711, reg_loss: 0.1709 ||:  21%|##1       | 20/95 [00:14<00:54,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9346, LAS: 0.8826, UEM: 0.5587, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9149, partial_loss/deprel_loss: 0.8323, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0199, loss: 0.8256, batch_reg_loss: 0.1711, reg_loss: 0.1709 ||:  24%|##4       | 23/95 [00:16<00:52,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8519, UAS: 0.9347, LAS: 0.8831, UEM: 0.6021, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9940, partial_loss/deprel_loss: 0.7965, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0072, loss: 0.8231, batch_reg_loss: 0.1712, reg_loss: 0.1710 ||:  27%|##7       | 26/95 [00:18<00:52,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9344, LAS: 0.8825, UEM: 0.5849, LEM: 0.3785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5843, partial_loss/deprel_loss: 0.6115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7773, loss: 0.8276, batch_reg_loss: 0.1712, reg_loss: 0.1710 ||:  32%|###1      | 30/95 [00:21<00:45,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8848, UAS: 0.9317, LAS: 0.8796, UEM: 0.5668, LEM: 0.3634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5949, partial_loss/deprel_loss: 0.6947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8460, loss: 0.8517, batch_reg_loss: 0.1713, reg_loss: 0.1710 ||:  35%|###4      | 33/95 [00:23<00:43,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9325, LAS: 0.8805, UEM: 0.5634, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7286, partial_loss/deprel_loss: 0.7000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8771, loss: 0.8469, batch_reg_loss: 0.1713, reg_loss: 0.1711 ||:  39%|###8      | 37/95 [00:25<00:39,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9337, LAS: 0.8818, UEM: 0.5497, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4293, partial_loss/deprel_loss: 0.5699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7132, loss: 0.8384, batch_reg_loss: 0.1714, reg_loss: 0.1711 ||:  43%|####3     | 41/95 [00:28<00:35,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9360, LAS: 0.8841, UEM: 0.5664, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3171, partial_loss/deprel_loss: 0.5417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6682, loss: 0.8215, batch_reg_loss: 0.1715, reg_loss: 0.1711 ||:  47%|####7     | 45/95 [00:30<00:32,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9355, LAS: 0.8832, UEM: 0.5485, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7287, partial_loss/deprel_loss: 0.7702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9334, loss: 0.8286, batch_reg_loss: 0.1715, reg_loss: 0.1711 ||:  52%|#####1    | 49/95 [00:33<00:29,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9374, LAS: 0.8854, UEM: 0.5735, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1057, partial_loss/deprel_loss: 0.2971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4304, loss: 0.8117, batch_reg_loss: 0.1716, reg_loss: 0.1712 ||:  56%|#####5    | 53/95 [00:36<00:28,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9383, LAS: 0.8866, UEM: 0.5730, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3638, partial_loss/deprel_loss: 0.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5678, loss: 0.8014, batch_reg_loss: 0.1716, reg_loss: 0.1712 ||:  60%|######    | 57/95 [00:38<00:25,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8118, UAS: 0.9382, LAS: 0.8865, UEM: 0.5793, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3618, partial_loss/deprel_loss: 1.0481, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2825, loss: 0.8016, batch_reg_loss: 0.1717, reg_loss: 0.1712 ||:  64%|######4   | 61/95 [00:41<00:23,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9387, LAS: 0.8872, UEM: 0.5830, LEM: 0.3528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2517, partial_loss/deprel_loss: 0.4606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5906, loss: 0.7965, batch_reg_loss: 0.1717, reg_loss: 0.1713 ||:  68%|######8   | 65/95 [00:44<00:21,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9388, LAS: 0.8873, UEM: 0.5816, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4330, partial_loss/deprel_loss: 0.5291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6816, loss: 0.7948, batch_reg_loss: 0.1718, reg_loss: 0.1713 ||:  72%|#######1  | 68/95 [00:46<00:18,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9387, LAS: 0.8871, UEM: 0.5752, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5528, partial_loss/deprel_loss: 0.6302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7865, loss: 0.7976, batch_reg_loss: 0.1718, reg_loss: 0.1713 ||:  75%|#######4  | 71/95 [00:48<00:16,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9384, LAS: 0.8868, UEM: 0.5740, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1857, partial_loss/deprel_loss: 0.8781, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1115, loss: 0.8005, batch_reg_loss: 0.1718, reg_loss: 0.1713 ||:  78%|#######7  | 74/95 [00:51<00:14,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9380, LAS: 0.8862, UEM: 0.5700, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4924, partial_loss/deprel_loss: 0.6506, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7909, loss: 0.8065, batch_reg_loss: 0.1719, reg_loss: 0.1714 ||:  81%|########1 | 77/95 [00:53<00:12,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8883, UAS: 0.9381, LAS: 0.8863, UEM: 0.5635, LEM: 0.3303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4670, partial_loss/deprel_loss: 0.6401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7774, loss: 0.8060, batch_reg_loss: 0.1719, reg_loss: 0.1714 ||:  85%|########5 | 81/95 [00:55<00:09,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9376, LAS: 0.8858, UEM: 0.5677, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2746, partial_loss/deprel_loss: 0.4309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5716, loss: 0.8091, batch_reg_loss: 0.1720, reg_loss: 0.1714 ||:  88%|########8 | 84/95 [00:57<00:07,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9380, LAS: 0.8862, UEM: 0.5673, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3007, partial_loss/deprel_loss: 0.4967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6295, loss: 0.8062, batch_reg_loss: 0.1720, reg_loss: 0.1714 ||:  92%|#########1| 87/95 [01:00<00:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8334, UAS: 0.9381, LAS: 0.8865, UEM: 0.5757, LEM: 0.3375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3601, partial_loss/deprel_loss: 0.9394, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1956, loss: 0.8051, batch_reg_loss: 0.1721, reg_loss: 0.1714 ||:  95%|#########4| 90/95 [01:02<00:03,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9388, LAS: 0.8872, UEM: 0.5787, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2748, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5881, loss: 0.8000, batch_reg_loss: 0.1721, reg_loss: 0.1715 ||:  98%|#########7| 93/95 [01:04<00:01,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9392, LAS: 0.8877, UEM: 0.5798, LEM: 0.3381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3072, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5817, loss: 0.7964, batch_reg_loss: 0.1722, reg_loss: 0.1715 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-07 00:06:06,255 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:06:06,255 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:06:06,255 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |       N/A\n",
+      "2023-04-07 00:06:06,255 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - UEM                      |     0.580  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - LEM                      |     0.338  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - EM                       |     0.915  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.307  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - UAS                      |     0.939  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.435  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - loss                     |     0.796  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - LAS                      |     0.888  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:06:06,256 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:06:06,257 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:06:06,257 - INFO - combo.training.trainer - Epoch duration: 0:01:06.240258\n",
+      "2023-04-07 00:06:06,257 - INFO - combo.training.trainer - Estimated training time remaining: 6:13:30\n",
+      "2023-04-07 00:06:06,257 - INFO - allennlp.training.trainer - Epoch 68/399\n",
+      "2023-04-07 00:06:06,258 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:06:06,258 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:06:06,265 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9587, LAS: 0.9139, UEM: 0.7856, LEM: 0.5824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2464, partial_loss/deprel_loss: 0.4504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5818, loss: 0.5819, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:   3%|3         | 3/95 [00:02<01:12,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9519, LAS: 0.9063, UEM: 0.7001, LEM: 0.4794, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1949, partial_loss/deprel_loss: 0.3622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5010, loss: 0.6616, batch_reg_loss: 0.1723, reg_loss: 0.1722 ||:   7%|7         | 7/95 [00:04<01:04,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9491, LAS: 0.9010, UEM: 0.6554, LEM: 0.4208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3870, partial_loss/deprel_loss: 0.5602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6979, loss: 0.7004, batch_reg_loss: 0.1723, reg_loss: 0.1722 ||:  12%|#1        | 11/95 [00:07<01:01,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9410, LAS: 0.8914, UEM: 0.6062, LEM: 0.3760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3762, partial_loss/deprel_loss: 0.4839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6347, loss: 0.7718, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  16%|#5        | 15/95 [00:10<00:55,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9450, LAS: 0.8954, UEM: 0.6326, LEM: 0.3857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2793, partial_loss/deprel_loss: 0.5585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6750, loss: 0.7440, batch_reg_loss: 0.1724, reg_loss: 0.1723 ||:  19%|#8        | 18/95 [00:12<00:54,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9463, LAS: 0.8969, UEM: 0.6529, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1125, partial_loss/deprel_loss: 0.2689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4100, loss: 0.7289, batch_reg_loss: 0.1724, reg_loss: 0.1723 ||:  22%|##2       | 21/95 [00:14<00:53,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9478, LAS: 0.8982, UEM: 0.6541, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2618, partial_loss/deprel_loss: 0.4876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6149, loss: 0.7217, batch_reg_loss: 0.1725, reg_loss: 0.1723 ||:  26%|##6       | 25/95 [00:17<00:49,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9481, LAS: 0.8985, UEM: 0.6538, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1610, partial_loss/deprel_loss: 0.3754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5051, loss: 0.7196, batch_reg_loss: 0.1725, reg_loss: 0.1724 ||:  31%|###       | 29/95 [00:19<00:44,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9472, LAS: 0.8979, UEM: 0.6350, LEM: 0.3883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9341, partial_loss/deprel_loss: 0.7667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9727, loss: 0.7252, batch_reg_loss: 0.1726, reg_loss: 0.1724 ||:  35%|###4      | 33/95 [00:22<00:41,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9463, LAS: 0.8962, UEM: 0.6173, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4791, partial_loss/deprel_loss: 0.5957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7450, loss: 0.7406, batch_reg_loss: 0.1726, reg_loss: 0.1724 ||:  39%|###8      | 37/95 [00:24<00:38,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9454, LAS: 0.8949, UEM: 0.6123, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7145, partial_loss/deprel_loss: 0.7944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9511, loss: 0.7485, batch_reg_loss: 0.1727, reg_loss: 0.1724 ||:  43%|####3     | 41/95 [00:27<00:34,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9445, LAS: 0.8940, UEM: 0.5998, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3833, partial_loss/deprel_loss: 0.5173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6633, loss: 0.7572, batch_reg_loss: 0.1727, reg_loss: 0.1725 ||:  47%|####7     | 45/95 [00:30<00:32,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9452, LAS: 0.8948, UEM: 0.6033, LEM: 0.3522, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6803, partial_loss/deprel_loss: 0.6569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8344, loss: 0.7507, batch_reg_loss: 0.1728, reg_loss: 0.1725 ||:  52%|#####1    | 49/95 [00:33<00:31,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9437, LAS: 0.8933, UEM: 0.5970, LEM: 0.3477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4687, partial_loss/deprel_loss: 0.5079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6729, loss: 0.7606, batch_reg_loss: 0.1729, reg_loss: 0.1725 ||:  55%|#####4    | 52/95 [00:35<00:30,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9430, LAS: 0.8921, UEM: 0.5866, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4625, partial_loss/deprel_loss: 0.6118, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7549, loss: 0.7677, batch_reg_loss: 0.1729, reg_loss: 0.1725 ||:  59%|#####8    | 56/95 [00:37<00:26,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8668, UAS: 0.9418, LAS: 0.8908, UEM: 0.5768, LEM: 0.3281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8159, partial_loss/deprel_loss: 0.7028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8984, loss: 0.7776, batch_reg_loss: 0.1730, reg_loss: 0.1726 ||:  63%|######3   | 60/95 [00:40<00:23,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9425, LAS: 0.8916, UEM: 0.5886, LEM: 0.3404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3835, partial_loss/deprel_loss: 0.4990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6489, loss: 0.7703, batch_reg_loss: 0.1731, reg_loss: 0.1726 ||:  67%|######7   | 64/95 [00:43<00:21,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9423, LAS: 0.8912, UEM: 0.5833, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6041, partial_loss/deprel_loss: 0.6684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8286, loss: 0.7740, batch_reg_loss: 0.1731, reg_loss: 0.1726 ||:  71%|#######   | 67/95 [00:45<00:19,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9422, LAS: 0.8907, UEM: 0.5799, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7295, partial_loss/deprel_loss: 0.7300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9031, loss: 0.7775, batch_reg_loss: 0.1732, reg_loss: 0.1726 ||:  75%|#######4  | 71/95 [00:48<00:16,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8350, UAS: 0.9406, LAS: 0.8892, UEM: 0.5718, LEM: 0.3253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3351, partial_loss/deprel_loss: 0.8683, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1349, loss: 0.7873, batch_reg_loss: 0.1732, reg_loss: 0.1727 ||:  78%|#######7  | 74/95 [00:50<00:14,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9409, LAS: 0.8895, UEM: 0.5731, LEM: 0.3258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5666, partial_loss/deprel_loss: 0.6794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8301, loss: 0.7837, batch_reg_loss: 0.1733, reg_loss: 0.1727 ||:  81%|########1 | 77/95 [00:52<00:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9407, LAS: 0.8893, UEM: 0.5694, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1221, partial_loss/deprel_loss: 0.9179, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1321, loss: 0.7865, batch_reg_loss: 0.1733, reg_loss: 0.1727 ||:  85%|########5 | 81/95 [00:54<00:09,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9393, LAS: 0.8878, UEM: 0.5622, LEM: 0.3165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4130, partial_loss/deprel_loss: 0.5317, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6813, loss: 0.7980, batch_reg_loss: 0.1734, reg_loss: 0.1727 ||:  89%|########9 | 85/95 [00:57<00:06,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8510, UAS: 0.9388, LAS: 0.8872, UEM: 0.5587, LEM: 0.3138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0143, partial_loss/deprel_loss: 0.9618, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1458, loss: 0.8031, batch_reg_loss: 0.1735, reg_loss: 0.1728 ||:  94%|#########3| 89/95 [01:00<00:04,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9396, LAS: 0.8882, UEM: 0.5774, LEM: 0.3391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0588, partial_loss/deprel_loss: 0.1635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3161, loss: 0.7969, batch_reg_loss: 0.1735, reg_loss: 0.1728 ||:  97%|#########6| 92/95 [01:03<00:02,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9393, LAS: 0.8879, UEM: 0.5786, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4150, partial_loss/deprel_loss: 0.9446, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2123, loss: 0.7990, batch_reg_loss: 0.1736, reg_loss: 0.1728 ||: 100%|##########| 95/95 [01:05<00:00,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9393, LAS: 0.8879, UEM: 0.5786, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4150, partial_loss/deprel_loss: 0.9446, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2123, loss: 0.7990, batch_reg_loss: 0.1736, reg_loss: 0.1728 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n",
+      "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |       N/A\n",
+      "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - UEM                      |     0.579  |       N/A\n",
+      "2023-04-07 00:07:11,491 - INFO - combo.training.tensorboard_writer - LEM                      |     0.341  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - EM                       |     0.834  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.415  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - UAS                      |     0.939  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.945  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - loss                     |     0.799  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - LAS                      |     0.888  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:07:11,492 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:07:11,493 - INFO - combo.training.trainer - Epoch duration: 0:01:05.235624\n",
+      "2023-04-07 00:07:11,493 - INFO - combo.training.trainer - Estimated training time remaining: 6:12:11\n",
+      "2023-04-07 00:07:11,493 - INFO - allennlp.training.trainer - Epoch 69/399\n",
+      "2023-04-07 00:07:11,493 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:07:11,494 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:07:11,501 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9319, LAS: 0.8809, UEM: 0.4658, LEM: 0.2588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2728, partial_loss/deprel_loss: 0.9373, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1780, loss: 0.8313, batch_reg_loss: 0.1736, reg_loss: 0.1736 ||:   4%|4         | 4/95 [00:02<00:55,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9396, LAS: 0.8886, UEM: 0.5949, LEM: 0.3610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2140, partial_loss/deprel_loss: 0.3690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5117, loss: 0.7732, batch_reg_loss: 0.1737, reg_loss: 0.1736 ||:   7%|7         | 7/95 [00:04<00:55,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9369, LAS: 0.8864, UEM: 0.6029, LEM: 0.3770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1628, partial_loss/deprel_loss: 0.3749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5062, loss: 0.7978, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  11%|#         | 10/95 [00:06<00:57,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9600, UAS: 0.9417, LAS: 0.8934, UEM: 0.6786, LEM: 0.4823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0577, partial_loss/deprel_loss: 0.1619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3148, loss: 0.7504, batch_reg_loss: 0.1738, reg_loss: 0.1737 ||:  14%|#3        | 13/95 [00:09<01:00,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9398, LAS: 0.8907, UEM: 0.6684, LEM: 0.4707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3221, partial_loss/deprel_loss: 0.9825, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2242, loss: 0.7711, batch_reg_loss: 0.1738, reg_loss: 0.1737 ||:  17%|#6        | 16/95 [00:11<00:57,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9422, LAS: 0.8933, UEM: 0.6685, LEM: 0.4569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6970, partial_loss/deprel_loss: 0.6860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8620, loss: 0.7529, batch_reg_loss: 0.1739, reg_loss: 0.1737 ||:  20%|##        | 19/95 [00:13<00:54,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9447, LAS: 0.8956, UEM: 0.6852, LEM: 0.4695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2802, partial_loss/deprel_loss: 0.4948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6258, loss: 0.7326, batch_reg_loss: 0.1739, reg_loss: 0.1737 ||:  23%|##3       | 22/95 [00:15<00:52,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9456, LAS: 0.8959, UEM: 0.6625, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3983, partial_loss/deprel_loss: 0.5102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.7349, batch_reg_loss: 0.1739, reg_loss: 0.1738 ||:  27%|##7       | 26/95 [00:18<00:47,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9426, LAS: 0.8929, UEM: 0.6455, LEM: 0.4189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3413, partial_loss/deprel_loss: 0.5252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6624, loss: 0.7604, batch_reg_loss: 0.1740, reg_loss: 0.1738 ||:  32%|###1      | 30/95 [00:20<00:43,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9441, LAS: 0.8945, UEM: 0.6442, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3032, partial_loss/deprel_loss: 0.4812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6196, loss: 0.7508, batch_reg_loss: 0.1740, reg_loss: 0.1738 ||:  35%|###4      | 33/95 [00:23<00:43,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9453, LAS: 0.8956, UEM: 0.6464, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2720, partial_loss/deprel_loss: 0.4392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5798, loss: 0.7407, batch_reg_loss: 0.1741, reg_loss: 0.1738 ||:  38%|###7      | 36/95 [00:25<00:40,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9452, LAS: 0.8957, UEM: 0.6449, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2043, partial_loss/deprel_loss: 0.3425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4890, loss: 0.7421, batch_reg_loss: 0.1741, reg_loss: 0.1739 ||:  41%|####1     | 39/95 [00:27<00:39,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9450, LAS: 0.8955, UEM: 0.6347, LEM: 0.3927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5268, partial_loss/deprel_loss: 0.6980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8379, loss: 0.7425, batch_reg_loss: 0.1742, reg_loss: 0.1739 ||:  44%|####4     | 42/95 [00:29<00:37,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9453, LAS: 0.8959, UEM: 0.6375, LEM: 0.3956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2734, partial_loss/deprel_loss: 0.4405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5813, loss: 0.7410, batch_reg_loss: 0.1742, reg_loss: 0.1739 ||:  47%|####7     | 45/95 [00:31<00:36,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8982, UAS: 0.9439, LAS: 0.8945, UEM: 0.6269, LEM: 0.3870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4470, partial_loss/deprel_loss: 0.5936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7385, loss: 0.7511, batch_reg_loss: 0.1742, reg_loss: 0.1739 ||:  51%|#####     | 48/95 [00:33<00:33,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9136, UAS: 0.9444, LAS: 0.8951, UEM: 0.6316, LEM: 0.3941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4268, partial_loss/deprel_loss: 0.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6436, loss: 0.7477, batch_reg_loss: 0.1743, reg_loss: 0.1739 ||:  54%|#####3    | 51/95 [00:38<00:41,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9433, LAS: 0.8940, UEM: 0.6272, LEM: 0.3922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2191, partial_loss/deprel_loss: 0.3953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5344, loss: 0.7587, batch_reg_loss: 0.1743, reg_loss: 0.1740 ||:  57%|#####6    | 54/95 [00:40<00:35,  1.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8403, UAS: 0.9428, LAS: 0.8932, UEM: 0.6212, LEM: 0.3846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0526, partial_loss/deprel_loss: 0.8650, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0768, loss: 0.7622, batch_reg_loss: 0.1744, reg_loss: 0.1740 ||:  60%|######    | 57/95 [00:42<00:31,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9407, LAS: 0.8908, UEM: 0.6071, LEM: 0.3733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5570, partial_loss/deprel_loss: 0.6794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8293, loss: 0.7790, batch_reg_loss: 0.1744, reg_loss: 0.1740 ||:  64%|######4   | 61/95 [00:45<00:26,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9403, LAS: 0.8903, UEM: 0.6131, LEM: 0.3780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1507, partial_loss/deprel_loss: 0.3130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4550, loss: 0.7813, batch_reg_loss: 0.1745, reg_loss: 0.1740 ||:  67%|######7   | 64/95 [00:47<00:24,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9405, LAS: 0.8903, UEM: 0.6066, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7340, partial_loss/deprel_loss: 0.7126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8914, loss: 0.7835, batch_reg_loss: 0.1745, reg_loss: 0.1740 ||:  71%|#######   | 67/95 [00:49<00:21,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.9400, LAS: 0.8898, UEM: 0.5994, LEM: 0.3642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1403, partial_loss/deprel_loss: 0.8225, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0606, loss: 0.7869, batch_reg_loss: 0.1746, reg_loss: 0.1741 ||:  75%|#######4  | 71/95 [00:52<00:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9404, LAS: 0.8902, UEM: 0.6003, LEM: 0.3654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2757, partial_loss/deprel_loss: 0.3715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5269, loss: 0.7836, batch_reg_loss: 0.1746, reg_loss: 0.1741 ||:  78%|#######7  | 74/95 [00:54<00:15,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9413, LAS: 0.8911, UEM: 0.6053, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2430, partial_loss/deprel_loss: 0.5264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6444, loss: 0.7775, batch_reg_loss: 0.1747, reg_loss: 0.1741 ||:  81%|########1 | 77/95 [00:56<00:13,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8475, UAS: 0.9409, LAS: 0.8904, UEM: 0.5997, LEM: 0.3602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9304, partial_loss/deprel_loss: 0.9354, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1091, loss: 0.7823, batch_reg_loss: 0.1747, reg_loss: 0.1741 ||:  85%|########5 | 81/95 [00:59<00:09,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9223, UAS: 0.9405, LAS: 0.8899, UEM: 0.5967, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.4255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5691, loss: 0.7860, batch_reg_loss: 0.1748, reg_loss: 0.1742 ||:  88%|########8 | 84/95 [01:01<00:07,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9405, LAS: 0.8898, UEM: 0.5912, LEM: 0.3526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7375, partial_loss/deprel_loss: 0.6926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8764, loss: 0.7868, batch_reg_loss: 0.1748, reg_loss: 0.1742 ||:  92%|#########1| 87/95 [01:03<00:05,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9404, LAS: 0.8896, UEM: 0.5846, LEM: 0.3457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5953, partial_loss/deprel_loss: 0.5995, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7735, loss: 0.7882, batch_reg_loss: 0.1749, reg_loss: 0.1742 ||:  96%|#########5| 91/95 [01:06<00:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9403, LAS: 0.8894, UEM: 0.5817, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2989, partial_loss/deprel_loss: 0.4423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5885, loss: 0.7904, batch_reg_loss: 0.1749, reg_loss: 0.1742 ||:  99%|#########8| 94/95 [01:08<00:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.9402, LAS: 0.8892, UEM: 0.5793, LEM: 0.3414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8387, partial_loss/deprel_loss: 0.7951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9788, loss: 0.7924, batch_reg_loss: 0.1750, reg_loss: 0.1743 ||: 100%|##########| 95/95 [01:08<00:00,  1.38it/s]\n",
+      "2023-04-07 00:08:20,495 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.174  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - UEM                      |     0.579  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - LEM                      |     0.341  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - EM                       |     0.872  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.839  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - UAS                      |     0.940  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.795  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - loss                     |     0.792  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:08:20,496 - INFO - combo.training.tensorboard_writer - LAS                      |     0.889  |       N/A\n",
+      "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:08:20,497 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:08:20,497 - INFO - combo.training.trainer - Epoch duration: 0:01:09.004150\n",
+      "2023-04-07 00:08:20,498 - INFO - combo.training.trainer - Estimated training time remaining: 6:11:11\n",
+      "2023-04-07 00:08:20,498 - INFO - allennlp.training.trainer - Epoch 70/399\n",
+      "2023-04-07 00:08:20,498 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:08:20,498 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:08:20,505 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9491, LAS: 0.9010, UEM: 0.7922, LEM: 0.6567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0717, partial_loss/deprel_loss: 0.1955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3458, loss: 0.7096, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:   3%|3         | 3/95 [00:02<01:19,  1.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9440, LAS: 0.8947, UEM: 0.7003, LEM: 0.5279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6981, partial_loss/deprel_loss: 0.7286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8976, loss: 0.7553, batch_reg_loss: 0.1751, reg_loss: 0.1750 ||:   6%|6         | 6/95 [00:04<01:13,  1.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9396, LAS: 0.8888, UEM: 0.6422, LEM: 0.4571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9106, partial_loss/deprel_loss: 0.7770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9788, loss: 0.8048, batch_reg_loss: 0.1751, reg_loss: 0.1750 ||:   9%|9         | 9/95 [00:06<01:06,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9413, LAS: 0.8906, UEM: 0.6105, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6072, partial_loss/deprel_loss: 0.7074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8625, loss: 0.7915, batch_reg_loss: 0.1752, reg_loss: 0.1751 ||:  13%|#2        | 12/95 [00:08<01:03,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9446, LAS: 0.8935, UEM: 0.6170, LEM: 0.3991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2828, partial_loss/deprel_loss: 0.5331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6582, loss: 0.7705, batch_reg_loss: 0.1752, reg_loss: 0.1751 ||:  16%|#5        | 15/95 [00:10<00:58,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9378, LAS: 0.8873, UEM: 0.5714, LEM: 0.3588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6191, partial_loss/deprel_loss: 0.6607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8276, loss: 0.8160, batch_reg_loss: 0.1753, reg_loss: 0.1751 ||:  20%|##        | 19/95 [00:13<00:53,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9368, LAS: 0.8858, UEM: 0.5476, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4515, partial_loss/deprel_loss: 0.5893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7370, loss: 0.8286, batch_reg_loss: 0.1753, reg_loss: 0.1751 ||:  23%|##3       | 22/95 [00:15<00:50,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9399, LAS: 0.8889, UEM: 0.5813, LEM: 0.3583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1573, partial_loss/deprel_loss: 0.3624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4967, loss: 0.8035, batch_reg_loss: 0.1753, reg_loss: 0.1752 ||:  27%|##7       | 26/95 [00:17<00:46,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9405, LAS: 0.8898, UEM: 0.5877, LEM: 0.3593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3158, partial_loss/deprel_loss: 0.4406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5911, loss: 0.7973, batch_reg_loss: 0.1754, reg_loss: 0.1752 ||:  32%|###1      | 30/95 [00:20<00:43,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9412, LAS: 0.8907, UEM: 0.5935, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8567, partial_loss/deprel_loss: 0.7805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9712, loss: 0.7906, batch_reg_loss: 0.1754, reg_loss: 0.1752 ||:  35%|###4      | 33/95 [00:22<00:42,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9419, LAS: 0.8914, UEM: 0.5897, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5001, partial_loss/deprel_loss: 0.5773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7373, loss: 0.7822, batch_reg_loss: 0.1755, reg_loss: 0.1752 ||:  38%|###7      | 36/95 [00:24<00:40,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9427, LAS: 0.8918, UEM: 0.5907, LEM: 0.3508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2411, partial_loss/deprel_loss: 0.3916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5370, loss: 0.7771, batch_reg_loss: 0.1755, reg_loss: 0.1753 ||:  42%|####2     | 40/95 [00:27<00:37,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8573, UAS: 0.9419, LAS: 0.8912, UEM: 0.5871, LEM: 0.3507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0417, partial_loss/deprel_loss: 0.8071, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0296, loss: 0.7813, batch_reg_loss: 0.1756, reg_loss: 0.1753 ||:  45%|####5     | 43/95 [00:29<00:36,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9427, LAS: 0.8918, UEM: 0.5864, LEM: 0.3449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4019, partial_loss/deprel_loss: 0.6446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7716, loss: 0.7764, batch_reg_loss: 0.1756, reg_loss: 0.1753 ||:  48%|####8     | 46/95 [00:32<00:35,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9442, LAS: 0.8934, UEM: 0.6045, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2332, partial_loss/deprel_loss: 0.4484, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5810, loss: 0.7629, batch_reg_loss: 0.1756, reg_loss: 0.1753 ||:  52%|#####1    | 49/95 [00:34<00:34,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9393, UAS: 0.9450, LAS: 0.8945, UEM: 0.6186, LEM: 0.3756, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1168, partial_loss/deprel_loss: 0.2561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4040, loss: 0.7553, batch_reg_loss: 0.1757, reg_loss: 0.1753 ||:  55%|#####4    | 52/95 [00:36<00:33,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9457, LAS: 0.8950, UEM: 0.6215, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4822, partial_loss/deprel_loss: 0.6509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7929, loss: 0.7510, batch_reg_loss: 0.1757, reg_loss: 0.1754 ||:  58%|#####7    | 55/95 [00:39<00:30,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.9443, LAS: 0.8935, UEM: 0.6121, LEM: 0.3654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2571, partial_loss/deprel_loss: 0.9744, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2066, loss: 0.7650, batch_reg_loss: 0.1757, reg_loss: 0.1754 ||:  62%|######2   | 59/95 [00:41<00:25,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9436, LAS: 0.8929, UEM: 0.6058, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3646, partial_loss/deprel_loss: 0.5462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6857, loss: 0.7703, batch_reg_loss: 0.1758, reg_loss: 0.1754 ||:  65%|######5   | 62/95 [00:43<00:23,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9439, LAS: 0.8931, UEM: 0.6097, LEM: 0.3655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1138, partial_loss/deprel_loss: 0.3408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4712, loss: 0.7681, batch_reg_loss: 0.1758, reg_loss: 0.1754 ||:  68%|######8   | 65/95 [00:45<00:20,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9446, LAS: 0.8938, UEM: 0.6160, LEM: 0.3680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2118, partial_loss/deprel_loss: 0.4220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5558, loss: 0.7613, batch_reg_loss: 0.1759, reg_loss: 0.1754 ||:  72%|#######1  | 68/95 [00:48<00:19,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9449, LAS: 0.8940, UEM: 0.6113, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4066, partial_loss/deprel_loss: 0.5803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7214, loss: 0.7603, batch_reg_loss: 0.1759, reg_loss: 0.1755 ||:  76%|#######5  | 72/95 [00:50<00:16,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9450, LAS: 0.8938, UEM: 0.6085, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2725, partial_loss/deprel_loss: 0.5266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6517, loss: 0.7618, batch_reg_loss: 0.1760, reg_loss: 0.1755 ||:  79%|#######8  | 75/95 [00:52<00:14,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8082, UAS: 0.9432, LAS: 0.8917, UEM: 0.5998, LEM: 0.3519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6078, partial_loss/deprel_loss: 1.0781, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3600, loss: 0.7772, batch_reg_loss: 0.1760, reg_loss: 0.1755 ||:  83%|########3 | 79/95 [00:55<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8639, UAS: 0.9420, LAS: 0.8903, UEM: 0.5945, LEM: 0.3479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8079, partial_loss/deprel_loss: 0.7865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9668, loss: 0.7864, batch_reg_loss: 0.1760, reg_loss: 0.1755 ||:  86%|########6 | 82/95 [00:57<00:09,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9422, LAS: 0.8905, UEM: 0.5936, LEM: 0.3463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9196, partial_loss/deprel_loss: 0.8773, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0618, loss: 0.7851, batch_reg_loss: 0.1761, reg_loss: 0.1756 ||:  89%|########9 | 85/95 [00:59<00:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9415, LAS: 0.8897, UEM: 0.5866, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1732, partial_loss/deprel_loss: 0.8958, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1274, loss: 0.7916, batch_reg_loss: 0.1762, reg_loss: 0.1756 ||:  94%|#########3| 89/95 [01:02<00:04,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9405, LAS: 0.8886, UEM: 0.5778, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2289, partial_loss/deprel_loss: 0.8653, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1143, loss: 0.8000, batch_reg_loss: 0.1762, reg_loss: 0.1756 ||:  98%|#########7| 93/95 [01:04<00:01,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9406, LAS: 0.8886, UEM: 0.5797, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1904, partial_loss/deprel_loss: 0.3714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5115, loss: 0.7998, batch_reg_loss: 0.1763, reg_loss: 0.1756 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-07 00:09:27,115 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9153, LAS: 0.8558, UEM: 0.1908, LEM: 0.0526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4304, partial_loss/deprel_loss: 56.5432, partial_loss/cycle_loss: 0.0000, batch_loss: 45.5206, loss: 42.2261, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:10,  1.15s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9318, LAS: 0.8726, UEM: 0.3708, LEM: 0.0868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4709, partial_loss/deprel_loss: 23.6317, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9995, loss: 33.1798, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:05<00:06,  1.08s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9432, LAS: 0.8868, UEM: 0.5980, LEM: 0.2941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2243, partial_loss/deprel_loss: 22.6137, partial_loss/cycle_loss: 0.0000, batch_loss: 18.1358, loss: 29.0568, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:07<00:04,  1.08s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9457, LAS: 0.8899, UEM: 0.6081, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4233, partial_loss/deprel_loss: 28.9285, partial_loss/cycle_loss: 0.0000, batch_loss: 23.2275, loss: 27.2084, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:09<00:00,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9483, LAS: 0.8943, UEM: 0.6744, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2251, partial_loss/deprel_loss: 19.1517, partial_loss/cycle_loss: 0.0000, batch_loss: 15.3664, loss: 26.1318, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.06it/s]\n",
+      "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.176  |     0.000\n",
+      "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - UEM                      |     0.580  |     0.674\n",
+      "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - LEM                      |     0.337  |     0.392\n",
+      "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - EM                       |     0.927  |     0.938\n",
+      "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.190  |     0.225\n",
+      "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:09:37,459 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |     0.948\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.371  |    19.152\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - loss                     |     0.800  |    26.132\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - LAS                      |     0.889  |     0.894\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:09:37,460 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:09:37,461 - INFO - combo.training.trainer - Epoch duration: 0:01:16.963087\n",
+      "2023-04-07 00:09:37,461 - INFO - combo.training.trainer - Estimated training time remaining: 6:10:48\n",
+      "2023-04-07 00:09:37,461 - INFO - allennlp.training.trainer - Epoch 71/399\n",
+      "2023-04-07 00:09:37,461 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:09:37,462 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:09:37,469 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9552, LAS: 0.9068, UEM: 0.6813, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1733, partial_loss/deprel_loss: 0.3007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4515, loss: 0.6592, batch_reg_loss: 0.1763, reg_loss: 0.1763 ||:   4%|4         | 4/95 [00:02<00:54,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9475, LAS: 0.8981, UEM: 0.5787, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4932, partial_loss/deprel_loss: 0.6592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8024, loss: 0.7276, batch_reg_loss: 0.1764, reg_loss: 0.1763 ||:   8%|8         | 8/95 [00:04<00:50,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9581, UAS: 0.9502, LAS: 0.9021, UEM: 0.6920, LEM: 0.4880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0532, partial_loss/deprel_loss: 0.1633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3177, loss: 0.6972, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  12%|#1        | 11/95 [00:06<00:53,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8585, UAS: 0.9455, LAS: 0.8973, UEM: 0.6476, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9427, partial_loss/deprel_loss: 0.8309, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0298, loss: 0.7332, batch_reg_loss: 0.1765, reg_loss: 0.1764 ||:  16%|#5        | 15/95 [00:09<00:48,  1.64it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9403, LAS: 0.8910, UEM: 0.5839, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6263, partial_loss/deprel_loss: 0.7611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9107, loss: 0.7906, batch_reg_loss: 0.1766, reg_loss: 0.1764 ||:  21%|##1       | 20/95 [00:11<00:41,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9412, LAS: 0.8917, UEM: 0.5907, LEM: 0.3735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2732, partial_loss/deprel_loss: 0.4341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5785, loss: 0.7859, batch_reg_loss: 0.1767, reg_loss: 0.1765 ||:  26%|##6       | 25/95 [00:13<00:38,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9380, LAS: 0.8878, UEM: 0.5626, LEM: 0.3477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5694, partial_loss/deprel_loss: 0.6708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8273, loss: 0.8117, batch_reg_loss: 0.1767, reg_loss: 0.1765 ||:  31%|###       | 29/95 [00:16<00:38,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9386, LAS: 0.8881, UEM: 0.5534, LEM: 0.3321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5307, partial_loss/deprel_loss: 0.6790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8262, loss: 0.8095, batch_reg_loss: 0.1768, reg_loss: 0.1765 ||:  35%|###4      | 33/95 [00:19<00:37,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9387, LAS: 0.8882, UEM: 0.5429, LEM: 0.3209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7026, partial_loss/deprel_loss: 0.6841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8647, loss: 0.8090, batch_reg_loss: 0.1768, reg_loss: 0.1766 ||:  39%|###8      | 37/95 [00:22<00:37,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8166, UAS: 0.9378, LAS: 0.8871, UEM: 0.5435, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5673, partial_loss/deprel_loss: 1.0897, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3621, loss: 0.8157, batch_reg_loss: 0.1769, reg_loss: 0.1766 ||:  43%|####3     | 41/95 [00:25<00:36,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9387, LAS: 0.8877, UEM: 0.5407, LEM: 0.3133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4908, partial_loss/deprel_loss: 0.5889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7463, loss: 0.8124, batch_reg_loss: 0.1770, reg_loss: 0.1766 ||:  46%|####6     | 44/95 [00:27<00:34,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8346, UAS: 0.9389, LAS: 0.8879, UEM: 0.5550, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3078, partial_loss/deprel_loss: 0.9468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1960, loss: 0.8088, batch_reg_loss: 0.1770, reg_loss: 0.1766 ||:  49%|####9     | 47/95 [00:29<00:32,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8530, UAS: 0.9387, LAS: 0.8879, UEM: 0.5572, LEM: 0.3274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0041, partial_loss/deprel_loss: 0.8890, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0890, loss: 0.8090, batch_reg_loss: 0.1771, reg_loss: 0.1767 ||:  53%|#####2    | 50/95 [00:31<00:31,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9385, LAS: 0.8875, UEM: 0.5519, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1688, partial_loss/deprel_loss: 0.9223, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1487, loss: 0.8117, batch_reg_loss: 0.1771, reg_loss: 0.1767 ||:  56%|#####5    | 53/95 [00:33<00:29,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9386, LAS: 0.8874, UEM: 0.5469, LEM: 0.3151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3167, partial_loss/deprel_loss: 0.4665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6137, loss: 0.8119, batch_reg_loss: 0.1771, reg_loss: 0.1767 ||:  59%|#####8    | 56/95 [00:35<00:27,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9388, LAS: 0.8876, UEM: 0.5448, LEM: 0.3094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3204, partial_loss/deprel_loss: 0.4900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6333, loss: 0.8105, batch_reg_loss: 0.1772, reg_loss: 0.1767 ||:  62%|######2   | 59/95 [00:37<00:25,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9393, LAS: 0.8880, UEM: 0.5485, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4376, partial_loss/deprel_loss: 0.6354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7731, loss: 0.8058, batch_reg_loss: 0.1772, reg_loss: 0.1768 ||:  65%|######5   | 62/95 [00:40<00:23,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9400, LAS: 0.8888, UEM: 0.5493, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3143, partial_loss/deprel_loss: 0.4986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.8020, batch_reg_loss: 0.1773, reg_loss: 0.1768 ||:  69%|######9   | 66/95 [00:42<00:20,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9409, LAS: 0.8897, UEM: 0.5563, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2309, partial_loss/deprel_loss: 0.4179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5579, loss: 0.7938, batch_reg_loss: 0.1774, reg_loss: 0.1768 ||:  74%|#######3  | 70/95 [00:45<00:16,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9395, LAS: 0.8883, UEM: 0.5604, LEM: 0.3172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1509, partial_loss/deprel_loss: 0.3368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4770, loss: 0.8039, batch_reg_loss: 0.1774, reg_loss: 0.1768 ||:  77%|#######6  | 73/95 [00:47<00:15,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9400, LAS: 0.8889, UEM: 0.5613, LEM: 0.3166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2819, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5803, loss: 0.8009, batch_reg_loss: 0.1774, reg_loss: 0.1769 ||:  80%|########  | 76/95 [00:49<00:13,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9402, LAS: 0.8893, UEM: 0.5742, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1263, partial_loss/deprel_loss: 0.2588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4097, loss: 0.7961, batch_reg_loss: 0.1775, reg_loss: 0.1769 ||:  83%|########3 | 79/95 [00:51<00:11,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9397, LAS: 0.8887, UEM: 0.5725, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5192, partial_loss/deprel_loss: 0.5978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7596, loss: 0.8023, batch_reg_loss: 0.1775, reg_loss: 0.1769 ||:  87%|########7 | 83/95 [00:54<00:08,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9400, LAS: 0.8889, UEM: 0.5712, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3889, partial_loss/deprel_loss: 0.5676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7094, loss: 0.8005, batch_reg_loss: 0.1776, reg_loss: 0.1769 ||:  91%|######### | 86/95 [00:56<00:06,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9400, LAS: 0.8890, UEM: 0.5667, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.5279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6837, loss: 0.7999, batch_reg_loss: 0.1776, reg_loss: 0.1770 ||:  94%|#########3| 89/95 [00:58<00:04,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8380, UAS: 0.9403, LAS: 0.8892, UEM: 0.5763, LEM: 0.3333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2965, partial_loss/deprel_loss: 0.9069, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1625, loss: 0.7979, batch_reg_loss: 0.1777, reg_loss: 0.1770 ||:  97%|#########6| 92/95 [01:01<00:02,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9412, LAS: 0.8901, UEM: 0.5836, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2061, partial_loss/deprel_loss: 0.4362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5679, loss: 0.7915, batch_reg_loss: 0.1777, reg_loss: 0.1770 ||: 100%|##########| 95/95 [01:03<00:00,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9412, LAS: 0.8901, UEM: 0.5836, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2061, partial_loss/deprel_loss: 0.4362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5679, loss: 0.7915, batch_reg_loss: 0.1777, reg_loss: 0.1770 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.177  |       N/A\n",
+      "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - UEM                      |     0.584  |       N/A\n",
+      "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - LEM                      |     0.337  |       N/A\n",
+      "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - EM                       |     0.918  |       N/A\n",
+      "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.206  |       N/A\n",
+      "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:10:41,101 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.436  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - loss                     |     0.792  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - LAS                      |     0.890  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:10:41,102 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:10:41,103 - INFO - combo.training.trainer - Epoch duration: 0:01:03.641837\n",
+      "2023-04-07 00:10:41,103 - INFO - combo.training.trainer - Estimated training time remaining: 6:09:22\n",
+      "2023-04-07 00:10:41,103 - INFO - allennlp.training.trainer - Epoch 72/399\n",
+      "2023-04-07 00:10:41,103 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:10:41,104 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:10:41,111 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9448, LAS: 0.8959, UEM: 0.6095, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2510, partial_loss/deprel_loss: 0.3756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5284, loss: 0.7326, batch_reg_loss: 0.1778, reg_loss: 0.1777 ||:   4%|4         | 4/95 [00:02<00:59,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8583, UAS: 0.9388, LAS: 0.8880, UEM: 0.5319, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0482, partial_loss/deprel_loss: 0.8046, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0311, loss: 0.8022, batch_reg_loss: 0.1778, reg_loss: 0.1778 ||:   7%|7         | 7/95 [00:04<00:59,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8759, UAS: 0.9419, LAS: 0.8927, UEM: 0.5798, LEM: 0.3305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7500, partial_loss/deprel_loss: 0.7594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9353, loss: 0.7699, batch_reg_loss: 0.1778, reg_loss: 0.1778 ||:  11%|#         | 10/95 [00:06<00:57,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8871, UAS: 0.9388, LAS: 0.8894, UEM: 0.5484, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6365, partial_loss/deprel_loss: 0.6350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8131, loss: 0.7911, batch_reg_loss: 0.1779, reg_loss: 0.1778 ||:  14%|#3        | 13/95 [00:08<00:55,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8920, UAS: 0.9358, LAS: 0.8860, UEM: 0.4914, LEM: 0.2684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5457, partial_loss/deprel_loss: 0.6326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7931, loss: 0.8190, batch_reg_loss: 0.1779, reg_loss: 0.1778 ||:  18%|#7        | 17/95 [00:11<00:51,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9401, LAS: 0.8908, UEM: 0.5316, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3911, partial_loss/deprel_loss: 0.4793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6397, loss: 0.7893, batch_reg_loss: 0.1780, reg_loss: 0.1778 ||:  21%|##1       | 20/95 [00:13<00:50,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9426, LAS: 0.8931, UEM: 0.5414, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4643, partial_loss/deprel_loss: 0.5793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7344, loss: 0.7734, batch_reg_loss: 0.1780, reg_loss: 0.1779 ||:  25%|##5       | 24/95 [00:16<00:47,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9434, LAS: 0.8941, UEM: 0.5586, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1725, partial_loss/deprel_loss: 0.3463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4896, loss: 0.7642, batch_reg_loss: 0.1781, reg_loss: 0.1779 ||:  29%|##9       | 28/95 [00:18<00:44,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9452, LAS: 0.8960, UEM: 0.5764, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3343, partial_loss/deprel_loss: 0.5059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6497, loss: 0.7491, batch_reg_loss: 0.1781, reg_loss: 0.1779 ||:  33%|###2      | 31/95 [00:21<00:46,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9472, LAS: 0.8988, UEM: 0.6355, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1090, partial_loss/deprel_loss: 0.2286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3829, loss: 0.7275, batch_reg_loss: 0.1782, reg_loss: 0.1780 ||:  36%|###5      | 34/95 [00:23<00:46,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9472, LAS: 0.8983, UEM: 0.6318, LEM: 0.3973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1485, partial_loss/deprel_loss: 0.3607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4965, loss: 0.7297, batch_reg_loss: 0.1782, reg_loss: 0.1780 ||:  40%|####      | 38/95 [00:26<00:41,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9472, LAS: 0.8981, UEM: 0.6233, LEM: 0.3842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5991, partial_loss/deprel_loss: 0.7210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8749, loss: 0.7319, batch_reg_loss: 0.1783, reg_loss: 0.1780 ||:  45%|####5     | 43/95 [00:28<00:33,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9457, LAS: 0.8964, UEM: 0.6122, LEM: 0.3766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5903, partial_loss/deprel_loss: 0.6357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8049, loss: 0.7461, batch_reg_loss: 0.1783, reg_loss: 0.1780 ||:  49%|####9     | 47/95 [00:30<00:28,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8240, UAS: 0.9435, LAS: 0.8936, UEM: 0.6103, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4303, partial_loss/deprel_loss: 1.0489, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3035, loss: 0.7667, batch_reg_loss: 0.1783, reg_loss: 0.1781 ||:  55%|#####4    | 52/95 [00:33<00:24,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9451, LAS: 0.8952, UEM: 0.6205, LEM: 0.3732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4625, partial_loss/deprel_loss: 0.5809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7356, loss: 0.7555, batch_reg_loss: 0.1784, reg_loss: 0.1781 ||:  60%|######    | 57/95 [00:35<00:20,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9441, LAS: 0.8940, UEM: 0.6165, LEM: 0.3692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3280, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6396, loss: 0.7638, batch_reg_loss: 0.1785, reg_loss: 0.1781 ||:  64%|######4   | 61/95 [00:38<00:18,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9427, LAS: 0.8925, UEM: 0.6059, LEM: 0.3611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8219, partial_loss/deprel_loss: 0.7629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9532, loss: 0.7773, batch_reg_loss: 0.1785, reg_loss: 0.1781 ||:  68%|######8   | 65/95 [00:40<00:17,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9424, LAS: 0.8920, UEM: 0.6026, LEM: 0.3569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4567, partial_loss/deprel_loss: 0.6063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7550, loss: 0.7816, batch_reg_loss: 0.1786, reg_loss: 0.1782 ||:  73%|#######2  | 69/95 [00:43<00:15,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9406, LAS: 0.8899, UEM: 0.5935, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3250, partial_loss/deprel_loss: 0.4898, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6355, loss: 0.7957, batch_reg_loss: 0.1787, reg_loss: 0.1782 ||:  77%|#######6  | 73/95 [00:45<00:13,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9418, LAS: 0.8913, UEM: 0.6129, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3080, partial_loss/deprel_loss: 0.4743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.7826, batch_reg_loss: 0.1787, reg_loss: 0.1782 ||:  81%|########1 | 77/95 [00:49<00:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8591, UAS: 0.9415, LAS: 0.8906, UEM: 0.6072, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7716, partial_loss/deprel_loss: 0.8624, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0230, loss: 0.7860, batch_reg_loss: 0.1788, reg_loss: 0.1782 ||:  85%|########5 | 81/95 [00:51<00:09,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9410, LAS: 0.8898, UEM: 0.5993, LEM: 0.3546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4964, partial_loss/deprel_loss: 0.6528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8003, loss: 0.7914, batch_reg_loss: 0.1789, reg_loss: 0.1783 ||:  89%|########9 | 85/95 [00:54<00:06,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8494, UAS: 0.9406, LAS: 0.8895, UEM: 0.5951, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0214, partial_loss/deprel_loss: 0.9291, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1265, loss: 0.7949, batch_reg_loss: 0.1789, reg_loss: 0.1783 ||:  94%|#########3| 89/95 [00:57<00:04,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9398, LAS: 0.8886, UEM: 0.5865, LEM: 0.3456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7952, partial_loss/deprel_loss: 0.6854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8863, loss: 0.8020, batch_reg_loss: 0.1790, reg_loss: 0.1783 ||:  98%|#########7| 93/95 [00:59<00:01,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9399, LAS: 0.8888, UEM: 0.5849, LEM: 0.3435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4183, partial_loss/deprel_loss: 0.5110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6715, loss: 0.8009, batch_reg_loss: 0.1790, reg_loss: 0.1783 ||: 100%|##########| 95/95 [01:01<00:00,  1.55it/s]\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.178  |       N/A\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - UEM                      |     0.585  |       N/A\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - LEM                      |     0.343  |       N/A\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - EM                       |     0.909  |       N/A\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.418  |       N/A\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:11:42,407 - INFO - combo.training.tensorboard_writer - UAS                      |     0.940  |       N/A\n",
+      "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.511  |       N/A\n",
+      "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - loss                     |     0.801  |       N/A\n",
+      "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - LAS                      |     0.889  |       N/A\n",
+      "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:11:42,408 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:11:42,409 - INFO - combo.training.trainer - Epoch duration: 0:01:01.305670\n",
+      "2023-04-07 00:11:42,409 - INFO - combo.training.trainer - Estimated training time remaining: 6:07:46\n",
+      "2023-04-07 00:11:42,409 - INFO - allennlp.training.trainer - Epoch 73/399\n",
+      "2023-04-07 00:11:42,409 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:11:42,410 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:11:42,416 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9595, LAS: 0.9081, UEM: 0.6650, LEM: 0.3547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3901, partial_loss/deprel_loss: 0.4729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6354, loss: 0.6435, batch_reg_loss: 0.1791, reg_loss: 0.1790 ||:   3%|3         | 3/95 [00:02<01:14,  1.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.9484, LAS: 0.8968, UEM: 0.5682, LEM: 0.2800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0665, partial_loss/deprel_loss: 0.8109, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0411, loss: 0.7307, batch_reg_loss: 0.1791, reg_loss: 0.1791 ||:   6%|6         | 6/95 [00:04<01:09,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8441, UAS: 0.9421, LAS: 0.8909, UEM: 0.5965, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2777, partial_loss/deprel_loss: 0.9002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1549, loss: 0.7789, batch_reg_loss: 0.1791, reg_loss: 0.1791 ||:   9%|9         | 9/95 [00:06<01:07,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9485, LAS: 0.8981, UEM: 0.6525, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3354, partial_loss/deprel_loss: 0.4767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6276, loss: 0.7280, batch_reg_loss: 0.1792, reg_loss: 0.1791 ||:  13%|#2        | 12/95 [00:08<01:02,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9463, LAS: 0.8966, UEM: 0.6072, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0163, partial_loss/deprel_loss: 0.8169, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0360, loss: 0.7424, batch_reg_loss: 0.1792, reg_loss: 0.1791 ||:  17%|#6        | 16/95 [00:11<00:55,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9420, LAS: 0.8917, UEM: 0.6009, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2641, partial_loss/deprel_loss: 0.4819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6176, loss: 0.7828, batch_reg_loss: 0.1793, reg_loss: 0.1792 ||:  20%|##        | 19/95 [00:13<00:53,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8748, UAS: 0.9395, LAS: 0.8894, UEM: 0.5673, LEM: 0.3185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7418, partial_loss/deprel_loss: 0.6360, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8364, loss: 0.7981, batch_reg_loss: 0.1793, reg_loss: 0.1792 ||:  23%|##3       | 22/95 [00:15<00:51,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9423, LAS: 0.8924, UEM: 0.5907, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2916, partial_loss/deprel_loss: 0.4751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6177, loss: 0.7735, batch_reg_loss: 0.1794, reg_loss: 0.1792 ||:  26%|##6       | 25/95 [00:17<00:51,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9420, LAS: 0.8923, UEM: 0.5727, LEM: 0.3133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9474, partial_loss/deprel_loss: 0.7746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9886, loss: 0.7773, batch_reg_loss: 0.1794, reg_loss: 0.1792 ||:  29%|##9       | 28/95 [00:20<00:48,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9428, LAS: 0.8931, UEM: 0.5892, LEM: 0.3345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4459, partial_loss/deprel_loss: 0.5201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6847, loss: 0.7717, batch_reg_loss: 0.1795, reg_loss: 0.1792 ||:  33%|###2      | 31/95 [00:22<00:46,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9407, LAS: 0.8906, UEM: 0.5706, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4817, partial_loss/deprel_loss: 0.5962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7528, loss: 0.7909, batch_reg_loss: 0.1795, reg_loss: 0.1793 ||:  37%|###6      | 35/95 [00:24<00:40,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9390, LAS: 0.8885, UEM: 0.5531, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6376, partial_loss/deprel_loss: 0.7715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9243, loss: 0.8063, batch_reg_loss: 0.1796, reg_loss: 0.1793 ||:  40%|####      | 38/95 [00:26<00:39,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9380, LAS: 0.8873, UEM: 0.5584, LEM: 0.3126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4264, partial_loss/deprel_loss: 0.5586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7118, loss: 0.8124, batch_reg_loss: 0.1796, reg_loss: 0.1793 ||:  43%|####3     | 41/95 [00:29<00:39,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9383, LAS: 0.8877, UEM: 0.5571, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2281, partial_loss/deprel_loss: 0.4436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5802, loss: 0.8078, batch_reg_loss: 0.1797, reg_loss: 0.1793 ||:  47%|####7     | 45/95 [00:31<00:34,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.9362, LAS: 0.8857, UEM: 0.5522, LEM: 0.3069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1931, partial_loss/deprel_loss: 0.8665, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1116, loss: 0.8223, batch_reg_loss: 0.1797, reg_loss: 0.1794 ||:  51%|#####     | 48/95 [00:33<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9368, LAS: 0.8861, UEM: 0.5426, LEM: 0.2982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5555, partial_loss/deprel_loss: 0.6462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8079, loss: 0.8225, batch_reg_loss: 0.1798, reg_loss: 0.1794 ||:  55%|#####4    | 52/95 [00:36<00:29,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9379, LAS: 0.8875, UEM: 0.5514, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2471, partial_loss/deprel_loss: 0.4047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5530, loss: 0.8107, batch_reg_loss: 0.1799, reg_loss: 0.1794 ||:  59%|#####8    | 56/95 [00:38<00:25,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9389, LAS: 0.8886, UEM: 0.5519, LEM: 0.3043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6545, partial_loss/deprel_loss: 0.6234, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8095, loss: 0.8024, batch_reg_loss: 0.1799, reg_loss: 0.1795 ||:  63%|######3   | 60/95 [00:41<00:22,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8556, UAS: 0.9393, LAS: 0.8887, UEM: 0.5533, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9760, partial_loss/deprel_loss: 0.8101, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0233, loss: 0.8015, batch_reg_loss: 0.1800, reg_loss: 0.1795 ||:  67%|######7   | 64/95 [00:44<00:21,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9565, UAS: 0.9405, LAS: 0.8903, UEM: 0.5824, LEM: 0.3405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0535, partial_loss/deprel_loss: 0.1670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3243, loss: 0.7917, batch_reg_loss: 0.1800, reg_loss: 0.1795 ||:  71%|#######   | 67/95 [00:46<00:20,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9412, LAS: 0.8909, UEM: 0.5884, LEM: 0.3439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3541, partial_loss/deprel_loss: 0.5629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7011, loss: 0.7866, batch_reg_loss: 0.1801, reg_loss: 0.1795 ||:  74%|#######3  | 70/95 [00:49<00:18,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9411, LAS: 0.8908, UEM: 0.5868, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3168, partial_loss/deprel_loss: 0.5028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6457, loss: 0.7875, batch_reg_loss: 0.1801, reg_loss: 0.1796 ||:  78%|#######7  | 74/95 [00:51<00:14,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9412, LAS: 0.8907, UEM: 0.5859, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4250, partial_loss/deprel_loss: 0.9116, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1944, loss: 0.7883, batch_reg_loss: 0.1801, reg_loss: 0.1796 ||:  83%|########3 | 79/95 [00:53<00:10,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9408, LAS: 0.8901, UEM: 0.5766, LEM: 0.3310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4056, partial_loss/deprel_loss: 0.5294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6848, loss: 0.7940, batch_reg_loss: 0.1802, reg_loss: 0.1796 ||:  88%|########8 | 84/95 [00:55<00:06,  1.77it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9403, LAS: 0.8895, UEM: 0.5670, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6572, partial_loss/deprel_loss: 0.7248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8915, loss: 0.7981, batch_reg_loss: 0.1803, reg_loss: 0.1797 ||:  94%|#########3| 89/95 [00:57<00:03,  1.92it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9404, LAS: 0.8896, UEM: 0.5810, LEM: 0.3396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9609, partial_loss/deprel_loss: 0.8782, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0751, loss: 0.7993, batch_reg_loss: 0.1803, reg_loss: 0.1797 ||:  99%|#########8| 94/95 [01:01<00:00,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9200, UAS: 0.9407, LAS: 0.8899, UEM: 0.5840, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2879, partial_loss/deprel_loss: 0.4204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5743, loss: 0.7969, batch_reg_loss: 0.1803, reg_loss: 0.1797 ||: 100%|##########| 95/95 [01:02<00:00,  1.53it/s]\n",
+      "2023-04-07 00:12:44,468 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:12:44,468 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:12:44,468 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.180  |       N/A\n",
+      "2023-04-07 00:12:44,468 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - UEM                      |     0.584  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - LEM                      |     0.342  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - EM                       |     0.920  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.288  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.420  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - loss                     |     0.797  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - LAS                      |     0.890  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:12:44,469 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:12:44,470 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:12:44,470 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:12:44,470 - INFO - combo.training.trainer - Epoch duration: 0:01:02.061214\n",
+      "2023-04-07 00:12:44,470 - INFO - combo.training.trainer - Estimated training time remaining: 6:06:15\n",
+      "2023-04-07 00:12:44,470 - INFO - allennlp.training.trainer - Epoch 74/399\n",
+      "2023-04-07 00:12:44,471 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:12:44,471 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:12:44,478 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8353, UAS: 0.9161, LAS: 0.8671, UEM: 0.3030, LEM: 0.1145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3191, partial_loss/deprel_loss: 0.8518, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1257, loss: 0.9598, batch_reg_loss: 0.1804, reg_loss: 0.1804 ||:   3%|3         | 3/95 [00:02<01:02,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9306, LAS: 0.8803, UEM: 0.4575, LEM: 0.2172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2753, partial_loss/deprel_loss: 0.4430, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5899, loss: 0.8639, batch_reg_loss: 0.1804, reg_loss: 0.1804 ||:   7%|7         | 7/95 [00:04<01:00,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9281, LAS: 0.8758, UEM: 0.4062, LEM: 0.1898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1880, partial_loss/deprel_loss: 0.8916, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1314, loss: 0.9038, batch_reg_loss: 0.1805, reg_loss: 0.1804 ||:  12%|#1        | 11/95 [00:07<00:55,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9557, UAS: 0.9358, LAS: 0.8859, UEM: 0.5790, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0826, partial_loss/deprel_loss: 0.1733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3357, loss: 0.8216, batch_reg_loss: 0.1806, reg_loss: 0.1805 ||:  16%|#5        | 15/95 [00:10<00:55,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9374, LAS: 0.8873, UEM: 0.5968, LEM: 0.3911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8965, partial_loss/deprel_loss: 0.7724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9778, loss: 0.8044, batch_reg_loss: 0.1806, reg_loss: 0.1805 ||:  19%|#8        | 18/95 [00:12<00:55,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8832, UAS: 0.9352, LAS: 0.8850, UEM: 0.5647, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6314, partial_loss/deprel_loss: 0.6904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8593, loss: 0.8253, batch_reg_loss: 0.1807, reg_loss: 0.1805 ||:  22%|##2       | 21/95 [00:14<00:52,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8838, UAS: 0.9381, LAS: 0.8877, UEM: 0.5643, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6442, partial_loss/deprel_loss: 0.7299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8934, loss: 0.8088, batch_reg_loss: 0.1807, reg_loss: 0.1805 ||:  26%|##6       | 25/95 [00:17<00:48,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9391, LAS: 0.8887, UEM: 0.5723, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2430, partial_loss/deprel_loss: 0.4033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5520, loss: 0.8021, batch_reg_loss: 0.1808, reg_loss: 0.1806 ||:  29%|##9       | 28/95 [00:19<00:47,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9377, LAS: 0.8867, UEM: 0.5533, LEM: 0.3328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5782, partial_loss/deprel_loss: 0.7032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8590, loss: 0.8184, batch_reg_loss: 0.1808, reg_loss: 0.1806 ||:  33%|###2      | 31/95 [00:21<00:44,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9377, LAS: 0.8864, UEM: 0.5491, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3226, partial_loss/deprel_loss: 0.4711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6222, loss: 0.8197, batch_reg_loss: 0.1808, reg_loss: 0.1806 ||:  36%|###5      | 34/95 [00:23<00:42,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8779, UAS: 0.9379, LAS: 0.8863, UEM: 0.5474, LEM: 0.3215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6239, partial_loss/deprel_loss: 0.7104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8740, loss: 0.8200, batch_reg_loss: 0.1809, reg_loss: 0.1806 ||:  39%|###8      | 37/95 [00:25<00:41,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9380, LAS: 0.8861, UEM: 0.5464, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2049, partial_loss/deprel_loss: 0.4376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5720, loss: 0.8221, batch_reg_loss: 0.1809, reg_loss: 0.1806 ||:  42%|####2     | 40/95 [00:28<00:40,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9390, LAS: 0.8873, UEM: 0.5618, LEM: 0.3281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5021, partial_loss/deprel_loss: 0.5595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7290, loss: 0.8097, batch_reg_loss: 0.1810, reg_loss: 0.1807 ||:  45%|####5     | 43/95 [00:30<00:37,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9395, LAS: 0.8878, UEM: 0.5577, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4646, partial_loss/deprel_loss: 0.5144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6855, loss: 0.8060, batch_reg_loss: 0.1810, reg_loss: 0.1807 ||:  48%|####8     | 46/95 [00:32<00:35,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9396, LAS: 0.8876, UEM: 0.5527, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7582, partial_loss/deprel_loss: 0.7119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9023, loss: 0.8061, batch_reg_loss: 0.1811, reg_loss: 0.1807 ||:  52%|#####1    | 49/95 [00:34<00:33,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8512, UAS: 0.9400, LAS: 0.8881, UEM: 0.5570, LEM: 0.3177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1542, partial_loss/deprel_loss: 0.9661, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1848, loss: 0.8046, batch_reg_loss: 0.1811, reg_loss: 0.1807 ||:  55%|#####4    | 52/95 [00:37<00:31,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9407, LAS: 0.8887, UEM: 0.5609, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2055, partial_loss/deprel_loss: 0.4421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5759, loss: 0.8005, batch_reg_loss: 0.1811, reg_loss: 0.1808 ||:  58%|#####7    | 55/95 [00:39<00:28,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9409, LAS: 0.8892, UEM: 0.5680, LEM: 0.3269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5210, partial_loss/deprel_loss: 0.6415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7986, loss: 0.7969, batch_reg_loss: 0.1812, reg_loss: 0.1808 ||:  61%|######1   | 58/95 [00:41<00:26,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9396, LAS: 0.8878, UEM: 0.5615, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5982, partial_loss/deprel_loss: 0.6778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8431, loss: 0.8095, batch_reg_loss: 0.1812, reg_loss: 0.1808 ||:  64%|######4   | 61/95 [00:43<00:24,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9401, LAS: 0.8883, UEM: 0.5663, LEM: 0.3250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1634, partial_loss/deprel_loss: 0.3427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.8067, batch_reg_loss: 0.1812, reg_loss: 0.1808 ||:  67%|######7   | 64/95 [00:45<00:22,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9403, LAS: 0.8884, UEM: 0.5733, LEM: 0.3329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5623, partial_loss/deprel_loss: 0.6810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8385, loss: 0.8059, batch_reg_loss: 0.1813, reg_loss: 0.1808 ||:  71%|#######   | 67/95 [00:47<00:20,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9399, LAS: 0.8881, UEM: 0.5782, LEM: 0.3375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2383, partial_loss/deprel_loss: 0.4386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5798, loss: 0.8079, batch_reg_loss: 0.1813, reg_loss: 0.1809 ||:  74%|#######3  | 70/95 [00:49<00:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9409, LAS: 0.8893, UEM: 0.5934, LEM: 0.3528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4208, partial_loss/deprel_loss: 0.5587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7125, loss: 0.7988, batch_reg_loss: 0.1814, reg_loss: 0.1809 ||:  77%|#######6  | 73/95 [00:51<00:15,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8297, UAS: 0.9406, LAS: 0.8888, UEM: 0.5909, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3382, partial_loss/deprel_loss: 0.9632, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2196, loss: 0.8014, batch_reg_loss: 0.1814, reg_loss: 0.1809 ||:  81%|########1 | 77/95 [00:54<00:12,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9407, LAS: 0.8889, UEM: 0.5936, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3455, partial_loss/deprel_loss: 0.5269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6721, loss: 0.7998, batch_reg_loss: 0.1815, reg_loss: 0.1809 ||:  84%|########4 | 80/95 [00:56<00:10,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9410, LAS: 0.8892, UEM: 0.5885, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4599, partial_loss/deprel_loss: 0.5396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7051, loss: 0.7969, batch_reg_loss: 0.1815, reg_loss: 0.1810 ||:  88%|########8 | 84/95 [00:59<00:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9411, LAS: 0.8891, UEM: 0.5851, LEM: 0.3421, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9966, partial_loss/deprel_loss: 0.9497, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1407, loss: 0.7987, batch_reg_loss: 0.1816, reg_loss: 0.1810 ||:  93%|#########2| 88/95 [01:02<00:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9414, LAS: 0.8894, UEM: 0.5865, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2723, partial_loss/deprel_loss: 0.4014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5572, loss: 0.7953, batch_reg_loss: 0.1816, reg_loss: 0.1810 ||:  96%|#########5| 91/95 [01:04<00:02,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9406, LAS: 0.8885, UEM: 0.5807, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3279, partial_loss/deprel_loss: 0.4952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6434, loss: 0.8012, batch_reg_loss: 0.1817, reg_loss: 0.1810 ||: 100%|##########| 95/95 [01:06<00:00,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9406, LAS: 0.8885, UEM: 0.5807, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3279, partial_loss/deprel_loss: 0.4952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6434, loss: 0.8012, batch_reg_loss: 0.1817, reg_loss: 0.1810 ||: 100%|##########| 95/95 [01:06<00:00,  1.42it/s]\n",
+      "2023-04-07 00:13:51,409 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.181  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - UEM                      |     0.581  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - LEM                      |     0.337  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - EM                       |     0.910  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.328  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.495  |       N/A\n",
+      "2023-04-07 00:13:51,410 - INFO - combo.training.tensorboard_writer - loss                     |     0.801  |       N/A\n",
+      "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - LAS                      |     0.889  |       N/A\n",
+      "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:13:51,411 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:13:51,412 - INFO - combo.training.trainer - Epoch duration: 0:01:06.941094\n",
+      "2023-04-07 00:13:51,412 - INFO - combo.training.trainer - Estimated training time remaining: 6:05:05\n",
+      "2023-04-07 00:13:51,412 - INFO - allennlp.training.trainer - Epoch 75/399\n",
+      "2023-04-07 00:13:51,412 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:13:51,412 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:13:51,419 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8504, UAS: 0.9098, LAS: 0.8622, UEM: 0.0877, LEM: 0.0132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1153, partial_loss/deprel_loss: 0.7604, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0131, loss: 0.9803, batch_reg_loss: 0.1817, reg_loss: 0.1817 ||:   3%|3         | 3/95 [00:02<01:03,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9272, LAS: 0.8776, UEM: 0.3059, LEM: 0.1173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6280, partial_loss/deprel_loss: 0.6272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8091, loss: 0.8778, batch_reg_loss: 0.1817, reg_loss: 0.1817 ||:   6%|6         | 6/95 [00:04<01:01,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9345, LAS: 0.8839, UEM: 0.3528, LEM: 0.1280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4540, partial_loss/deprel_loss: 0.5823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7384, loss: 0.8420, batch_reg_loss: 0.1818, reg_loss: 0.1817 ||:  11%|#         | 10/95 [00:06<00:55,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9377, LAS: 0.8877, UEM: 0.4580, LEM: 0.2246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2667, partial_loss/deprel_loss: 0.5394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6667, loss: 0.8077, batch_reg_loss: 0.1819, reg_loss: 0.1818 ||:  16%|#5        | 15/95 [00:08<00:47,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9347, LAS: 0.8835, UEM: 0.4359, LEM: 0.2086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4911, partial_loss/deprel_loss: 0.6512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8011, loss: 0.8421, batch_reg_loss: 0.1819, reg_loss: 0.1818 ||:  21%|##1       | 20/95 [00:11<00:41,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9372, LAS: 0.8859, UEM: 0.4520, LEM: 0.2106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7598, partial_loss/deprel_loss: 0.7057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8985, loss: 0.8208, batch_reg_loss: 0.1820, reg_loss: 0.1818 ||:  26%|##6       | 25/95 [00:13<00:35,  1.95it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9382, LAS: 0.8873, UEM: 0.5193, LEM: 0.2827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2472, partial_loss/deprel_loss: 0.4111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5604, loss: 0.8099, batch_reg_loss: 0.1821, reg_loss: 0.1819 ||:  32%|###1      | 30/95 [00:15<00:32,  2.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9392, LAS: 0.8884, UEM: 0.5258, LEM: 0.2831, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4649, partial_loss/deprel_loss: 0.5791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7385, loss: 0.8038, batch_reg_loss: 0.1822, reg_loss: 0.1819 ||:  36%|###5      | 34/95 [00:17<00:31,  1.94it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9396, LAS: 0.8886, UEM: 0.5388, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1500, partial_loss/deprel_loss: 0.8686, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1071, loss: 0.8017, batch_reg_loss: 0.1822, reg_loss: 0.1819 ||:  40%|####      | 38/95 [00:20<00:34,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9409, LAS: 0.8901, UEM: 0.5459, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4996, partial_loss/deprel_loss: 0.6586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8091, loss: 0.7930, batch_reg_loss: 0.1823, reg_loss: 0.1820 ||:  44%|####4     | 42/95 [00:23<00:33,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8711, UAS: 0.9402, LAS: 0.8892, UEM: 0.5421, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6804, partial_loss/deprel_loss: 0.7860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9472, loss: 0.7997, batch_reg_loss: 0.1823, reg_loss: 0.1820 ||:  48%|####8     | 46/95 [00:26<00:32,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9410, LAS: 0.8900, UEM: 0.5659, LEM: 0.3133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2153, partial_loss/deprel_loss: 0.4134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5561, loss: 0.7930, batch_reg_loss: 0.1824, reg_loss: 0.1820 ||:  53%|#####2    | 50/95 [00:29<00:30,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7834, UAS: 0.9403, LAS: 0.8895, UEM: 0.5902, LEM: 0.3509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0890, partial_loss/deprel_loss: 1.1278, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5024, loss: 0.7955, batch_reg_loss: 0.1824, reg_loss: 0.1821 ||:  57%|#####6    | 54/95 [00:32<00:29,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9410, LAS: 0.8903, UEM: 0.5907, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5388, partial_loss/deprel_loss: 0.5865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7594, loss: 0.7904, batch_reg_loss: 0.1825, reg_loss: 0.1821 ||:  60%|######    | 57/95 [00:35<00:27,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9407, LAS: 0.8899, UEM: 0.5785, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3906, partial_loss/deprel_loss: 0.5374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6905, loss: 0.7937, batch_reg_loss: 0.1825, reg_loss: 0.1821 ||:  64%|######4   | 61/95 [00:37<00:23,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9415, LAS: 0.8906, UEM: 0.5929, LEM: 0.3509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1582, partial_loss/deprel_loss: 0.3439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4893, loss: 0.7883, batch_reg_loss: 0.1826, reg_loss: 0.1821 ||:  67%|######7   | 64/95 [00:39<00:22,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9421, LAS: 0.8914, UEM: 0.6002, LEM: 0.3563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2630, partial_loss/deprel_loss: 0.4084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5620, loss: 0.7812, batch_reg_loss: 0.1826, reg_loss: 0.1821 ||:  71%|#######   | 67/95 [00:42<00:20,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.9420, LAS: 0.8914, UEM: 0.5963, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3357, partial_loss/deprel_loss: 0.8577, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1360, loss: 0.7819, batch_reg_loss: 0.1827, reg_loss: 0.1822 ||:  75%|#######4  | 71/95 [00:44<00:16,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9426, LAS: 0.8922, UEM: 0.6031, LEM: 0.3568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2671, partial_loss/deprel_loss: 0.3893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5476, loss: 0.7760, batch_reg_loss: 0.1827, reg_loss: 0.1822 ||:  78%|#######7  | 74/95 [00:47<00:15,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.9417, LAS: 0.8911, UEM: 0.5919, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9803, partial_loss/deprel_loss: 0.8861, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0877, loss: 0.7840, batch_reg_loss: 0.1827, reg_loss: 0.1822 ||:  82%|########2 | 78/95 [00:49<00:11,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9425, LAS: 0.8920, UEM: 0.5974, LEM: 0.3508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3638, partial_loss/deprel_loss: 0.4613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6246, loss: 0.7768, batch_reg_loss: 0.1828, reg_loss: 0.1822 ||:  85%|########5 | 81/95 [00:51<00:10,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8313, UAS: 0.9422, LAS: 0.8917, UEM: 0.5951, LEM: 0.3479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4579, partial_loss/deprel_loss: 0.9162, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2073, loss: 0.7794, batch_reg_loss: 0.1828, reg_loss: 0.1823 ||:  88%|########8 | 84/95 [00:54<00:08,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9420, LAS: 0.8915, UEM: 0.5913, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7022, partial_loss/deprel_loss: 0.7376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9134, loss: 0.7813, batch_reg_loss: 0.1828, reg_loss: 0.1823 ||:  92%|#########1| 87/95 [00:56<00:05,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9407, LAS: 0.8900, UEM: 0.5821, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0682, partial_loss/deprel_loss: 0.8623, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0864, loss: 0.7937, batch_reg_loss: 0.1829, reg_loss: 0.1823 ||:  96%|#########5| 91/95 [00:58<00:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9406, LAS: 0.8899, UEM: 0.5845, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1381, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4865, loss: 0.7951, batch_reg_loss: 0.1829, reg_loss: 0.1823 ||: 100%|##########| 95/95 [01:01<00:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9406, LAS: 0.8899, UEM: 0.5845, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1381, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4865, loss: 0.7951, batch_reg_loss: 0.1829, reg_loss: 0.1823 ||: 100%|##########| 95/95 [01:01<00:00,  1.54it/s]\n",
+      "2023-04-07 00:14:53,028 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9663, LAS: 0.9206, UEM: 0.8083, LEM: 0.5614, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4550, partial_loss/deprel_loss: 28.7498, partial_loss/cycle_loss: 0.0000, batch_loss: 23.0908, loss: 20.1704, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:07,  1.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9597, LAS: 0.9119, UEM: 0.7813, LEM: 0.5211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2073, partial_loss/deprel_loss: 22.4669, partial_loss/cycle_loss: 0.0000, batch_loss: 18.0150, loss: 20.2816, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:05,  1.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9470, LAS: 0.8946, UEM: 0.7130, LEM: 0.4618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0117, partial_loss/deprel_loss: 43.2696, partial_loss/cycle_loss: 0.0000, batch_loss: 34.8180, loss: 25.7831, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:07<00:04,  1.00s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9468, LAS: 0.8939, UEM: 0.6769, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4092, partial_loss/deprel_loss: 24.0904, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3541, loss: 26.5160, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:09<00:00,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9475, LAS: 0.8947, UEM: 0.6682, LEM: 0.3981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5189, partial_loss/deprel_loss: 23.4807, partial_loss/cycle_loss: 0.0000, batch_loss: 18.8884, loss: 25.8226, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.02it/s]\n",
+      "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.182  |     0.000\n",
+      "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - UEM                      |     0.584  |     0.668\n",
+      "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - LEM                      |     0.340  |     0.398\n",
+      "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - EM                       |     0.922  |     0.902\n",
+      "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.138  |     0.519\n",
+      "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:15:03,818 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |     0.947\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.345  |    23.481\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - loss                     |     0.795  |    25.823\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - LAS                      |     0.890  |     0.895\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:15:03,819 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:15:03,820 - INFO - combo.training.trainer - Epoch duration: 0:01:12.408039\n",
+      "2023-04-07 00:15:03,820 - INFO - combo.training.trainer - Estimated training time remaining: 6:04:19\n",
+      "2023-04-07 00:15:03,820 - INFO - allennlp.training.trainer - Epoch 76/399\n",
+      "2023-04-07 00:15:03,820 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:15:03,821 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:15:03,827 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9547, LAS: 0.9081, UEM: 0.5728, LEM: 0.2605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3512, partial_loss/deprel_loss: 0.4644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6248, loss: 0.6572, batch_reg_loss: 0.1830, reg_loss: 0.1830 ||:   3%|3         | 3/95 [00:02<01:08,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9568, LAS: 0.9083, UEM: 0.6590, LEM: 0.3677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1612, partial_loss/deprel_loss: 0.3406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.6524, batch_reg_loss: 0.1831, reg_loss: 0.1830 ||:   7%|7         | 7/95 [00:04<01:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9493, LAS: 0.8998, UEM: 0.6395, LEM: 0.3545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5184, partial_loss/deprel_loss: 0.5381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7173, loss: 0.7159, batch_reg_loss: 0.1831, reg_loss: 0.1830 ||:  11%|#         | 10/95 [00:07<01:02,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9520, LAS: 0.9034, UEM: 0.6523, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3222, partial_loss/deprel_loss: 0.5445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6831, loss: 0.6955, batch_reg_loss: 0.1831, reg_loss: 0.1831 ||:  14%|#3        | 13/95 [00:09<00:59,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8932, UAS: 0.9500, LAS: 0.9006, UEM: 0.6224, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3848, partial_loss/deprel_loss: 0.5336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6871, loss: 0.7136, batch_reg_loss: 0.1832, reg_loss: 0.1831 ||:  17%|#6        | 16/95 [00:11<00:56,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9455, LAS: 0.8956, UEM: 0.5912, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9029, partial_loss/deprel_loss: 0.7841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9911, loss: 0.7523, batch_reg_loss: 0.1832, reg_loss: 0.1831 ||:  21%|##1       | 20/95 [00:14<00:52,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9457, LAS: 0.8952, UEM: 0.5852, LEM: 0.3140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7514, partial_loss/deprel_loss: 0.6884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8843, loss: 0.7547, batch_reg_loss: 0.1833, reg_loss: 0.1831 ||:  24%|##4       | 23/95 [00:16<00:50,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8887, UAS: 0.9466, LAS: 0.8961, UEM: 0.5951, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4828, partial_loss/deprel_loss: 0.6079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7662, loss: 0.7427, batch_reg_loss: 0.1833, reg_loss: 0.1831 ||:  27%|##7       | 26/95 [00:18<00:48,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9473, LAS: 0.8969, UEM: 0.5933, LEM: 0.3197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6708, partial_loss/deprel_loss: 0.6070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8031, loss: 0.7368, batch_reg_loss: 0.1833, reg_loss: 0.1832 ||:  31%|###       | 29/95 [00:20<00:45,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8887, UAS: 0.9449, LAS: 0.8939, UEM: 0.5724, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5364, partial_loss/deprel_loss: 0.6407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8032, loss: 0.7615, batch_reg_loss: 0.1834, reg_loss: 0.1832 ||:  35%|###4      | 33/95 [00:22<00:39,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9462, LAS: 0.8961, UEM: 0.6060, LEM: 0.3546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4429, partial_loss/deprel_loss: 0.5341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6993, loss: 0.7474, batch_reg_loss: 0.1834, reg_loss: 0.1832 ||:  39%|###8      | 37/95 [00:24<00:35,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9435, LAS: 0.8931, UEM: 0.5781, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7130, partial_loss/deprel_loss: 0.7432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9206, loss: 0.7751, batch_reg_loss: 0.1835, reg_loss: 0.1832 ||:  44%|####4     | 42/95 [00:26<00:30,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9434, LAS: 0.8932, UEM: 0.5714, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2446, partial_loss/deprel_loss: 0.4314, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5776, loss: 0.7747, batch_reg_loss: 0.1836, reg_loss: 0.1833 ||:  49%|####9     | 47/95 [00:29<00:26,  1.85it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9430, LAS: 0.8925, UEM: 0.5749, LEM: 0.3285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2560, partial_loss/deprel_loss: 0.4518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5963, loss: 0.7768, batch_reg_loss: 0.1837, reg_loss: 0.1833 ||:  55%|#####4    | 52/95 [00:32<00:23,  1.84it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8299, UAS: 0.9423, LAS: 0.8914, UEM: 0.5673, LEM: 0.3215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3642, partial_loss/deprel_loss: 1.0457, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2931, loss: 0.7864, batch_reg_loss: 0.1837, reg_loss: 0.1833 ||:  59%|#####8    | 56/95 [00:34<00:22,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8675, UAS: 0.9403, LAS: 0.8895, UEM: 0.5516, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8775, partial_loss/deprel_loss: 0.8152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0115, loss: 0.8033, batch_reg_loss: 0.1838, reg_loss: 0.1834 ||:  63%|######3   | 60/95 [00:37<00:21,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.9389, LAS: 0.8881, UEM: 0.5582, LEM: 0.3259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9317, partial_loss/deprel_loss: 0.8423, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0441, loss: 0.8129, batch_reg_loss: 0.1838, reg_loss: 0.1834 ||:  67%|######7   | 64/95 [00:40<00:19,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9395, LAS: 0.8886, UEM: 0.5596, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3226, partial_loss/deprel_loss: 0.5221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6661, loss: 0.8077, batch_reg_loss: 0.1839, reg_loss: 0.1834 ||:  72%|#######1  | 68/95 [00:43<00:17,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9394, LAS: 0.8886, UEM: 0.5535, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5394, partial_loss/deprel_loss: 0.6583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8185, loss: 0.8094, batch_reg_loss: 0.1840, reg_loss: 0.1834 ||:  76%|#######5  | 72/95 [00:45<00:15,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9399, LAS: 0.8891, UEM: 0.5571, LEM: 0.3188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1855, partial_loss/deprel_loss: 0.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5217, loss: 0.8048, batch_reg_loss: 0.1840, reg_loss: 0.1835 ||:  79%|#######8  | 75/95 [00:48<00:13,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9399, LAS: 0.8891, UEM: 0.5653, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1215, partial_loss/deprel_loss: 0.3250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4684, loss: 0.8041, batch_reg_loss: 0.1841, reg_loss: 0.1835 ||:  82%|########2 | 78/95 [00:50<00:12,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9399, LAS: 0.8889, UEM: 0.5597, LEM: 0.3211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6635, partial_loss/deprel_loss: 0.7208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8935, loss: 0.8050, batch_reg_loss: 0.1841, reg_loss: 0.1835 ||:  86%|########6 | 82/95 [00:52<00:08,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9406, LAS: 0.8896, UEM: 0.5637, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2760, partial_loss/deprel_loss: 0.4656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.8000, batch_reg_loss: 0.1842, reg_loss: 0.1835 ||:  89%|########9 | 85/95 [00:55<00:06,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9402, LAS: 0.8892, UEM: 0.5712, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2545, partial_loss/deprel_loss: 0.4326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5812, loss: 0.8039, batch_reg_loss: 0.1842, reg_loss: 0.1836 ||:  93%|#########2| 88/95 [00:57<00:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9401, LAS: 0.8893, UEM: 0.5745, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3026, partial_loss/deprel_loss: 0.3780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5472, loss: 0.8029, batch_reg_loss: 0.1843, reg_loss: 0.1836 ||:  96%|#########5| 91/95 [00:59<00:02,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9405, LAS: 0.8898, UEM: 0.5815, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1445, partial_loss/deprel_loss: 0.3091, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4605, loss: 0.7986, batch_reg_loss: 0.1843, reg_loss: 0.1836 ||:  99%|#########8| 94/95 [01:02<00:00,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8948, UAS: 0.9405, LAS: 0.8898, UEM: 0.5795, LEM: 0.3377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5905, partial_loss/deprel_loss: 0.5858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7710, loss: 0.7983, batch_reg_loss: 0.1843, reg_loss: 0.1836 ||: 100%|##########| 95/95 [01:02<00:00,  1.51it/s]\n",
+      "2023-04-07 00:16:06,583 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.184  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - UEM                      |     0.580  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - LEM                      |     0.338  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - EM                       |     0.895  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.590  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - UAS                      |     0.940  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.586  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - loss                     |     0.798  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - LAS                      |     0.890  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:16:06,584 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:16:06,585 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:16:06,585 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:16:06,585 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:16:06,585 - INFO - combo.training.trainer - Epoch duration: 0:01:02.765135\n",
+      "2023-04-07 00:16:06,585 - INFO - combo.training.trainer - Estimated training time remaining: 6:02:52\n",
+      "2023-04-07 00:16:06,585 - INFO - allennlp.training.trainer - Epoch 77/399\n",
+      "2023-04-07 00:16:06,586 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:16:06,586 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:16:06,592 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9439, LAS: 0.8889, UEM: 0.4439, LEM: 0.1970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2992, partial_loss/deprel_loss: 0.4709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6209, loss: 0.8255, batch_reg_loss: 0.1843, reg_loss: 0.1843 ||:   3%|3         | 3/95 [00:02<01:07,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9431, LAS: 0.8890, UEM: 0.4924, LEM: 0.2474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8434, partial_loss/deprel_loss: 0.7793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9765, loss: 0.8081, batch_reg_loss: 0.1844, reg_loss: 0.1843 ||:   6%|6         | 6/95 [00:04<01:08,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9478, LAS: 0.8955, UEM: 0.5686, LEM: 0.3123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2481, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5179, loss: 0.7473, batch_reg_loss: 0.1844, reg_loss: 0.1844 ||:   9%|9         | 9/95 [00:06<01:04,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9347, LAS: 0.8827, UEM: 0.4864, LEM: 0.2618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7772, partial_loss/deprel_loss: 0.7062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9048, loss: 0.8470, batch_reg_loss: 0.1845, reg_loss: 0.1844 ||:  14%|#3        | 13/95 [00:09<00:58,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9397, LAS: 0.8877, UEM: 0.5467, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1979, partial_loss/deprel_loss: 0.4105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5525, loss: 0.8047, batch_reg_loss: 0.1845, reg_loss: 0.1844 ||:  17%|#6        | 16/95 [00:11<01:00,  1.32it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9374, LAS: 0.8854, UEM: 0.5454, LEM: 0.2955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4462, partial_loss/deprel_loss: 0.5947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7495, loss: 0.8263, batch_reg_loss: 0.1845, reg_loss: 0.1844 ||:  20%|##        | 19/95 [00:14<00:58,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9405, LAS: 0.8888, UEM: 0.5523, LEM: 0.2922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5662, partial_loss/deprel_loss: 0.6405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8102, loss: 0.8055, batch_reg_loss: 0.1846, reg_loss: 0.1845 ||:  24%|##4       | 23/95 [00:16<00:52,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9394, LAS: 0.8878, UEM: 0.5432, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2411, partial_loss/deprel_loss: 0.3998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5528, loss: 0.8084, batch_reg_loss: 0.1847, reg_loss: 0.1845 ||:  28%|##8       | 27/95 [00:19<00:48,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8636, UAS: 0.9340, LAS: 0.8821, UEM: 0.5129, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9194, partial_loss/deprel_loss: 0.8653, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0609, loss: 0.8523, batch_reg_loss: 0.1847, reg_loss: 0.1845 ||:  33%|###2      | 31/95 [00:21<00:42,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9354, LAS: 0.8840, UEM: 0.5591, LEM: 0.3393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5434, partial_loss/deprel_loss: 0.6119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7830, loss: 0.8391, batch_reg_loss: 0.1848, reg_loss: 0.1845 ||:  36%|###5      | 34/95 [00:24<00:41,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8713, UAS: 0.9371, LAS: 0.8851, UEM: 0.5599, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8156, partial_loss/deprel_loss: 0.7787, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9709, loss: 0.8295, batch_reg_loss: 0.1848, reg_loss: 0.1846 ||:  41%|####1     | 39/95 [00:26<00:35,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9384, LAS: 0.8866, UEM: 0.5612, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4756, partial_loss/deprel_loss: 0.5991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7593, loss: 0.8215, batch_reg_loss: 0.1849, reg_loss: 0.1846 ||:  45%|####5     | 43/95 [00:29<00:33,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9381, LAS: 0.8864, UEM: 0.5519, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5294, partial_loss/deprel_loss: 0.6338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7978, loss: 0.8225, batch_reg_loss: 0.1850, reg_loss: 0.1846 ||:  49%|####9     | 47/95 [00:31<00:31,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9369, LAS: 0.8851, UEM: 0.5357, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9746, partial_loss/deprel_loss: 0.9515, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1411, loss: 0.8355, batch_reg_loss: 0.1850, reg_loss: 0.1847 ||:  54%|#####3    | 51/95 [00:34<00:28,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9376, LAS: 0.8861, UEM: 0.5443, LEM: 0.3138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2375, partial_loss/deprel_loss: 0.3977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5507, loss: 0.8279, batch_reg_loss: 0.1851, reg_loss: 0.1847 ||:  58%|#####7    | 55/95 [00:37<00:27,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9386, LAS: 0.8872, UEM: 0.5507, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2844, partial_loss/deprel_loss: 0.4675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6160, loss: 0.8197, batch_reg_loss: 0.1851, reg_loss: 0.1847 ||:  61%|######1   | 58/95 [00:39<00:25,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9364, LAS: 0.8849, UEM: 0.5422, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8464, partial_loss/deprel_loss: 0.7982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9930, loss: 0.8352, batch_reg_loss: 0.1852, reg_loss: 0.1847 ||:  65%|######5   | 62/95 [00:42<00:22,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9373, LAS: 0.8858, UEM: 0.5426, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3489, partial_loss/deprel_loss: 0.5047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6588, loss: 0.8285, batch_reg_loss: 0.1852, reg_loss: 0.1848 ||:  69%|######9   | 66/95 [00:44<00:19,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9378, LAS: 0.8860, UEM: 0.5439, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2682, partial_loss/deprel_loss: 0.3856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5474, loss: 0.8271, batch_reg_loss: 0.1853, reg_loss: 0.1848 ||:  74%|#######3  | 70/95 [00:47<00:16,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9374, LAS: 0.8858, UEM: 0.5356, LEM: 0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4395, partial_loss/deprel_loss: 0.4952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6694, loss: 0.8292, batch_reg_loss: 0.1853, reg_loss: 0.1848 ||:  78%|#######7  | 74/95 [00:49<00:13,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9384, LAS: 0.8870, UEM: 0.5484, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6598, partial_loss/deprel_loss: 0.6407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8299, loss: 0.8207, batch_reg_loss: 0.1854, reg_loss: 0.1848 ||:  82%|########2 | 78/95 [00:51<00:10,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9392, LAS: 0.8877, UEM: 0.5513, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4937, partial_loss/deprel_loss: 0.5759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7449, loss: 0.8148, batch_reg_loss: 0.1854, reg_loss: 0.1849 ||:  86%|########6 | 82/95 [00:54<00:07,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9389, LAS: 0.8873, UEM: 0.5511, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7606, partial_loss/deprel_loss: 0.7955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9740, loss: 0.8184, batch_reg_loss: 0.1855, reg_loss: 0.1849 ||:  91%|######### | 86/95 [00:56<00:05,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9400, LAS: 0.8885, UEM: 0.5753, LEM: 0.3387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6608, partial_loss/deprel_loss: 0.7416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9110, loss: 0.8076, batch_reg_loss: 0.1855, reg_loss: 0.1849 ||:  95%|#########4| 90/95 [00:59<00:03,  1.63it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9410, LAS: 0.8896, UEM: 0.5826, LEM: 0.3418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4913, partial_loss/deprel_loss: 0.5570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7294, loss: 0.7992, batch_reg_loss: 0.1856, reg_loss: 0.1850 ||:  99%|#########8| 94/95 [01:01<00:00,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9410, LAS: 0.8896, UEM: 0.5808, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5826, partial_loss/deprel_loss: 0.6339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8092, loss: 0.7993, batch_reg_loss: 0.1856, reg_loss: 0.1850 ||: 100%|##########| 95/95 [01:02<00:00,  1.53it/s]\n",
+      "2023-04-07 00:17:08,825 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:17:08,825 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.185  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - UEM                      |     0.581  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - LEM                      |     0.340  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - EM                       |     0.885  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.583  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.634  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - loss                     |     0.799  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - LAS                      |     0.890  |       N/A\n",
+      "2023-04-07 00:17:08,826 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:17:08,827 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:17:08,827 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:17:08,827 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:17:08,827 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:17:08,827 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:17:08,827 - INFO - combo.training.trainer - Epoch duration: 0:01:02.242022\n",
+      "2023-04-07 00:17:08,828 - INFO - combo.training.trainer - Estimated training time remaining: 6:01:23\n",
+      "2023-04-07 00:17:08,828 - INFO - allennlp.training.trainer - Epoch 78/399\n",
+      "2023-04-07 00:17:08,828 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:17:08,828 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:17:08,835 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9408, LAS: 0.8896, UEM: 0.4489, LEM: 0.1972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3233, partial_loss/deprel_loss: 0.4872, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6400, loss: 0.7744, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||:   4%|4         | 4/95 [00:02<00:50,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9516, LAS: 0.9008, UEM: 0.5703, LEM: 0.2929, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4229, partial_loss/deprel_loss: 0.5818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7356, loss: 0.7034, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||:   9%|9         | 9/95 [00:04<00:44,  1.92it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9517, LAS: 0.9012, UEM: 0.5555, LEM: 0.2744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4896, partial_loss/deprel_loss: 0.5947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7594, loss: 0.7013, batch_reg_loss: 0.1857, reg_loss: 0.1856 ||:  15%|#4        | 14/95 [00:06<00:40,  2.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8719, UAS: 0.9517, LAS: 0.9016, UEM: 0.5903, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9200, partial_loss/deprel_loss: 0.7536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9726, loss: 0.6973, batch_reg_loss: 0.1857, reg_loss: 0.1856 ||:  18%|#7        | 17/95 [00:08<00:43,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8616, UAS: 0.9495, LAS: 0.8992, UEM: 0.5741, LEM: 0.2999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0144, partial_loss/deprel_loss: 0.8644, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0801, loss: 0.7219, batch_reg_loss: 0.1857, reg_loss: 0.1856 ||:  21%|##1       | 20/95 [00:10<00:45,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8480, UAS: 0.9484, LAS: 0.8985, UEM: 0.5931, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2113, partial_loss/deprel_loss: 0.8566, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1133, loss: 0.7258, batch_reg_loss: 0.1857, reg_loss: 0.1857 ||:  24%|##4       | 23/95 [00:12<00:45,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9433, LAS: 0.8927, UEM: 0.5676, LEM: 0.3096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9793, partial_loss/deprel_loss: 0.8778, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0839, loss: 0.7736, batch_reg_loss: 0.1858, reg_loss: 0.1857 ||:  28%|##8       | 27/95 [00:15<00:43,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9438, LAS: 0.8934, UEM: 0.5776, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1801, partial_loss/deprel_loss: 0.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.7694, batch_reg_loss: 0.1858, reg_loss: 0.1857 ||:  32%|###1      | 30/95 [00:17<00:44,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9449, LAS: 0.8951, UEM: 0.5874, LEM: 0.3332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1557, partial_loss/deprel_loss: 0.3232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4756, loss: 0.7584, batch_reg_loss: 0.1859, reg_loss: 0.1857 ||:  36%|###5      | 34/95 [00:20<00:40,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9446, LAS: 0.8950, UEM: 0.5828, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0273, partial_loss/deprel_loss: 0.7961, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0282, loss: 0.7593, batch_reg_loss: 0.1859, reg_loss: 0.1857 ||:  39%|###8      | 37/95 [00:22<00:39,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9452, LAS: 0.8955, UEM: 0.5810, LEM: 0.3247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6163, partial_loss/deprel_loss: 0.7001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8693, loss: 0.7570, batch_reg_loss: 0.1859, reg_loss: 0.1857 ||:  42%|####2     | 40/95 [00:24<00:39,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9457, LAS: 0.8963, UEM: 0.6039, LEM: 0.3536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1135, partial_loss/deprel_loss: 0.2364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3978, loss: 0.7489, batch_reg_loss: 0.1860, reg_loss: 0.1857 ||:  45%|####5     | 43/95 [00:27<00:38,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9445, LAS: 0.8949, UEM: 0.6038, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2625, partial_loss/deprel_loss: 0.4436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5934, loss: 0.7595, batch_reg_loss: 0.1860, reg_loss: 0.1858 ||:  49%|####9     | 47/95 [00:30<00:34,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9448, LAS: 0.8950, UEM: 0.6067, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5044, partial_loss/deprel_loss: 0.6603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8152, loss: 0.7586, batch_reg_loss: 0.1861, reg_loss: 0.1858 ||:  53%|#####2    | 50/95 [00:32<00:32,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9457, LAS: 0.8961, UEM: 0.6171, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4020, partial_loss/deprel_loss: 0.5094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6740, loss: 0.7499, batch_reg_loss: 0.1861, reg_loss: 0.1858 ||:  56%|#####5    | 53/95 [00:34<00:31,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9461, LAS: 0.8965, UEM: 0.6158, LEM: 0.3657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3005, partial_loss/deprel_loss: 0.4337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.7458, batch_reg_loss: 0.1861, reg_loss: 0.1858 ||:  59%|#####8    | 56/95 [00:37<00:30,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9464, LAS: 0.8966, UEM: 0.6168, LEM: 0.3648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7613, partial_loss/deprel_loss: 0.6916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8917, loss: 0.7440, batch_reg_loss: 0.1862, reg_loss: 0.1858 ||:  62%|######2   | 59/95 [00:39<00:29,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9471, LAS: 0.8972, UEM: 0.6218, LEM: 0.3678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3180, partial_loss/deprel_loss: 0.4791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6331, loss: 0.7379, batch_reg_loss: 0.1862, reg_loss: 0.1859 ||:  65%|######5   | 62/95 [00:42<00:26,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9469, LAS: 0.8969, UEM: 0.6130, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6629, partial_loss/deprel_loss: 0.6976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8769, loss: 0.7409, batch_reg_loss: 0.1862, reg_loss: 0.1859 ||:  68%|######8   | 65/95 [00:44<00:22,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9017, UAS: 0.9460, LAS: 0.8959, UEM: 0.6022, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4262, partial_loss/deprel_loss: 0.5080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6779, loss: 0.7506, batch_reg_loss: 0.1862, reg_loss: 0.1859 ||:  73%|#######2  | 69/95 [00:46<00:18,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8572, UAS: 0.9448, LAS: 0.8947, UEM: 0.5979, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0539, partial_loss/deprel_loss: 0.8267, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0584, loss: 0.7597, batch_reg_loss: 0.1863, reg_loss: 0.1859 ||:  77%|#######6  | 73/95 [00:49<00:15,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8405, UAS: 0.9446, LAS: 0.8948, UEM: 0.6111, LEM: 0.3705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2930, partial_loss/deprel_loss: 0.9116, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1742, loss: 0.7602, batch_reg_loss: 0.1863, reg_loss: 0.1859 ||:  80%|########  | 76/95 [00:51<00:13,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9432, LAS: 0.8931, UEM: 0.6007, LEM: 0.3616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6972, partial_loss/deprel_loss: 0.7468, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9233, loss: 0.7716, batch_reg_loss: 0.1864, reg_loss: 0.1859 ||:  84%|########4 | 80/95 [00:53<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9420, LAS: 0.8918, UEM: 0.5955, LEM: 0.3565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3082, partial_loss/deprel_loss: 0.5144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6596, loss: 0.7820, batch_reg_loss: 0.1864, reg_loss: 0.1860 ||:  88%|########8 | 84/95 [00:56<00:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9415, LAS: 0.8910, UEM: 0.5861, LEM: 0.3487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5924, partial_loss/deprel_loss: 0.6303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8092, loss: 0.7896, batch_reg_loss: 0.1865, reg_loss: 0.1860 ||:  93%|#########2| 88/95 [00:59<00:04,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9401, LAS: 0.8894, UEM: 0.5803, LEM: 0.3445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2964, partial_loss/deprel_loss: 0.4255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5862, loss: 0.7997, batch_reg_loss: 0.1866, reg_loss: 0.1860 ||:  97%|#########6| 92/95 [01:01<00:01,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9401, LAS: 0.8894, UEM: 0.5777, LEM: 0.3402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8968, partial_loss/deprel_loss: 0.7831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9924, loss: 0.8005, batch_reg_loss: 0.1866, reg_loss: 0.1860 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.186  |       N/A\n",
+      "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - UEM                      |     0.578  |       N/A\n",
+      "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - LEM                      |     0.340  |       N/A\n",
+      "2023-04-07 00:18:12,488 - INFO - combo.training.tensorboard_writer - EM                       |     0.866  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.897  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - UAS                      |     0.940  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.783  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - loss                     |     0.800  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - LAS                      |     0.889  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:18:12,489 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:18:12,490 - INFO - combo.training.trainer - Epoch duration: 0:01:03.662416\n",
+      "2023-04-07 00:18:12,490 - INFO - combo.training.trainer - Estimated training time remaining: 6:00:01\n",
+      "2023-04-07 00:18:12,490 - INFO - allennlp.training.trainer - Epoch 79/399\n",
+      "2023-04-07 00:18:12,490 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:18:12,491 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:18:12,498 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9283, LAS: 0.8772, UEM: 0.4899, LEM: 0.2588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2977, partial_loss/deprel_loss: 0.4617, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6156, loss: 0.8829, batch_reg_loss: 0.1867, reg_loss: 0.1867 ||:   3%|3         | 3/95 [00:02<01:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9239, LAS: 0.8754, UEM: 0.5283, LEM: 0.2744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3208, partial_loss/deprel_loss: 0.4771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6326, loss: 0.8969, batch_reg_loss: 0.1867, reg_loss: 0.1867 ||:   6%|6         | 6/95 [00:04<01:03,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9365, LAS: 0.8881, UEM: 0.5864, LEM: 0.3135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4957, partial_loss/deprel_loss: 0.6628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8162, loss: 0.8139, batch_reg_loss: 0.1868, reg_loss: 0.1867 ||:   9%|9         | 9/95 [00:06<01:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9396, LAS: 0.8913, UEM: 0.6205, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4121, partial_loss/deprel_loss: 0.5223, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6871, loss: 0.7861, batch_reg_loss: 0.1868, reg_loss: 0.1867 ||:  13%|#2        | 12/95 [00:08<01:01,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9441, LAS: 0.8958, UEM: 0.6585, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2032, partial_loss/deprel_loss: 0.3666, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5207, loss: 0.7440, batch_reg_loss: 0.1869, reg_loss: 0.1868 ||:  16%|#5        | 15/95 [00:11<01:00,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9459, LAS: 0.8981, UEM: 0.6616, LEM: 0.3956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3285, partial_loss/deprel_loss: 0.4213, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5896, loss: 0.7234, batch_reg_loss: 0.1869, reg_loss: 0.1868 ||:  19%|#8        | 18/95 [00:13<00:59,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9478, LAS: 0.9004, UEM: 0.6716, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6162, partial_loss/deprel_loss: 0.6331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8167, loss: 0.7079, batch_reg_loss: 0.1869, reg_loss: 0.1868 ||:  22%|##2       | 21/95 [00:15<00:55,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9474, LAS: 0.9000, UEM: 0.6755, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0440, partial_loss/deprel_loss: 0.8140, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0470, loss: 0.7136, batch_reg_loss: 0.1870, reg_loss: 0.1868 ||:  25%|##5       | 24/95 [00:18<00:55,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8607, UAS: 0.9417, LAS: 0.8937, UEM: 0.6401, LEM: 0.3942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0526, partial_loss/deprel_loss: 0.8241, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0568, loss: 0.7640, batch_reg_loss: 0.1870, reg_loss: 0.1868 ||:  29%|##9       | 28/95 [00:20<00:49,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.9379, LAS: 0.8896, UEM: 0.6116, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3279, partial_loss/deprel_loss: 0.8781, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1551, loss: 0.7982, batch_reg_loss: 0.1870, reg_loss: 0.1869 ||:  34%|###3      | 32/95 [00:23<00:43,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9366, LAS: 0.8882, UEM: 0.5996, LEM: 0.3624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3334, partial_loss/deprel_loss: 0.4300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5977, loss: 0.8117, batch_reg_loss: 0.1871, reg_loss: 0.1869 ||:  38%|###7      | 36/95 [00:25<00:37,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8622, UAS: 0.9358, LAS: 0.8873, UEM: 0.5815, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8832, partial_loss/deprel_loss: 0.7934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9985, loss: 0.8199, batch_reg_loss: 0.1872, reg_loss: 0.1869 ||:  43%|####3     | 41/95 [00:27<00:32,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8604, UAS: 0.9343, LAS: 0.8852, UEM: 0.5650, LEM: 0.3333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0274, partial_loss/deprel_loss: 0.8131, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0432, loss: 0.8361, batch_reg_loss: 0.1873, reg_loss: 0.1870 ||:  48%|####8     | 46/95 [00:29<00:27,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9351, LAS: 0.8856, UEM: 0.5620, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5172, partial_loss/deprel_loss: 0.6135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7816, loss: 0.8314, batch_reg_loss: 0.1873, reg_loss: 0.1870 ||:  53%|#####2    | 50/95 [00:31<00:24,  1.85it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9369, LAS: 0.8876, UEM: 0.5930, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5163, partial_loss/deprel_loss: 0.5533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7333, loss: 0.8152, batch_reg_loss: 0.1874, reg_loss: 0.1870 ||:  57%|#####6    | 54/95 [00:35<00:25,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8488, UAS: 0.9359, LAS: 0.8866, UEM: 0.5788, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1207, partial_loss/deprel_loss: 0.8376, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0817, loss: 0.8220, batch_reg_loss: 0.1875, reg_loss: 0.1870 ||:  61%|######1   | 58/95 [00:37<00:23,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9366, LAS: 0.8873, UEM: 0.5778, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4081, partial_loss/deprel_loss: 0.5361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6980, loss: 0.8168, batch_reg_loss: 0.1875, reg_loss: 0.1871 ||:  65%|######5   | 62/95 [00:40<00:21,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9374, LAS: 0.8880, UEM: 0.5757, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3767, partial_loss/deprel_loss: 0.5423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6967, loss: 0.8132, batch_reg_loss: 0.1876, reg_loss: 0.1871 ||:  69%|######9   | 66/95 [00:43<00:18,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9378, LAS: 0.8881, UEM: 0.5715, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6738, partial_loss/deprel_loss: 0.6987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8813, loss: 0.8116, batch_reg_loss: 0.1876, reg_loss: 0.1871 ||:  74%|#######3  | 70/95 [00:45<00:16,  1.55it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9212, UAS: 0.9375, LAS: 0.8878, UEM: 0.5671, LEM: 0.3360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2480, partial_loss/deprel_loss: 0.3709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5340, loss: 0.8145, batch_reg_loss: 0.1877, reg_loss: 0.1872 ||:  78%|#######7  | 74/95 [00:48<00:13,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9382, LAS: 0.8884, UEM: 0.5671, LEM: 0.3338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4622, partial_loss/deprel_loss: 0.5921, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7539, loss: 0.8099, batch_reg_loss: 0.1877, reg_loss: 0.1872 ||:  82%|########2 | 78/95 [00:50<00:10,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9385, LAS: 0.8885, UEM: 0.5614, LEM: 0.3265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6567, partial_loss/deprel_loss: 0.6606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8476, loss: 0.8097, batch_reg_loss: 0.1878, reg_loss: 0.1872 ||:  86%|########6 | 82/95 [00:53<00:08,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9396, LAS: 0.8897, UEM: 0.5765, LEM: 0.3417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4273, partial_loss/deprel_loss: 0.5450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7093, loss: 0.8001, batch_reg_loss: 0.1878, reg_loss: 0.1872 ||:  91%|######### | 86/95 [00:55<00:05,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9400, LAS: 0.8899, UEM: 0.5763, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3665, partial_loss/deprel_loss: 0.5096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6688, loss: 0.7984, batch_reg_loss: 0.1879, reg_loss: 0.1873 ||:  95%|#########4| 90/95 [00:58<00:03,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9405, LAS: 0.8904, UEM: 0.5754, LEM: 0.3353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3016, partial_loss/deprel_loss: 0.5141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6595, loss: 0.7965, batch_reg_loss: 0.1879, reg_loss: 0.1873 ||:  99%|#########8| 94/95 [01:01<00:00,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9408, LAS: 0.8907, UEM: 0.5806, LEM: 0.3402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2214, partial_loss/deprel_loss: 0.3765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5335, loss: 0.7937, batch_reg_loss: 0.1879, reg_loss: 0.1873 ||: 100%|##########| 95/95 [01:01<00:00,  1.53it/s]\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.187  |       N/A\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - UEM                      |     0.581  |       N/A\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - LEM                      |     0.340  |       N/A\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - EM                       |     0.920  |       N/A\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.221  |       N/A\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:19:14,422 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |       N/A\n",
+      "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.377  |       N/A\n",
+      "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - loss                     |     0.794  |       N/A\n",
+      "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - LAS                      |     0.891  |       N/A\n",
+      "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:19:14,423 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:19:14,424 - INFO - combo.training.trainer - Epoch duration: 0:01:01.933450\n",
+      "2023-04-07 00:19:14,424 - INFO - combo.training.trainer - Estimated training time remaining: 5:58:32\n",
+      "2023-04-07 00:19:14,424 - INFO - allennlp.training.trainer - Epoch 80/399\n",
+      "2023-04-07 00:19:14,424 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:19:14,424 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:19:14,431 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9596, LAS: 0.9109, UEM: 0.6800, LEM: 0.3824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1690, partial_loss/deprel_loss: 0.3843, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5292, loss: 0.6419, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||:   4%|4         | 4/95 [00:02<01:05,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9272, UAS: 0.9480, LAS: 0.8989, UEM: 0.6161, LEM: 0.3407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2618, partial_loss/deprel_loss: 0.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5638, loss: 0.7364, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||:   7%|7         | 7/95 [00:05<01:04,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9512, LAS: 0.9017, UEM: 0.6269, LEM: 0.3572, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2605, partial_loss/deprel_loss: 0.4553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.7124, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||:  12%|#1        | 11/95 [00:07<01:00,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9506, LAS: 0.9014, UEM: 0.6104, LEM: 0.3410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3772, partial_loss/deprel_loss: 0.5111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6724, loss: 0.7203, batch_reg_loss: 0.1881, reg_loss: 0.1880 ||:  15%|#4        | 14/95 [00:10<00:58,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9499, LAS: 0.9004, UEM: 0.5876, LEM: 0.3188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2876, partial_loss/deprel_loss: 0.5166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6589, loss: 0.7232, batch_reg_loss: 0.1881, reg_loss: 0.1880 ||:  19%|#8        | 18/95 [00:12<00:52,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9505, LAS: 0.9008, UEM: 0.5854, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5094, partial_loss/deprel_loss: 0.5760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7508, loss: 0.7181, batch_reg_loss: 0.1881, reg_loss: 0.1880 ||:  22%|##2       | 21/95 [00:14<00:50,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9527, LAS: 0.9041, UEM: 0.6489, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3647, partial_loss/deprel_loss: 0.4708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6377, loss: 0.6928, batch_reg_loss: 0.1882, reg_loss: 0.1881 ||:  25%|##5       | 24/95 [00:17<00:53,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9512, LAS: 0.9019, UEM: 0.6426, LEM: 0.3904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5918, partial_loss/deprel_loss: 0.6836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8535, loss: 0.7120, batch_reg_loss: 0.1882, reg_loss: 0.1881 ||:  29%|##9       | 28/95 [00:19<00:48,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9469, LAS: 0.8971, UEM: 0.6465, LEM: 0.4018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1478, partial_loss/deprel_loss: 0.3533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5004, loss: 0.7485, batch_reg_loss: 0.1882, reg_loss: 0.1881 ||:  33%|###2      | 31/95 [00:22<00:48,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9449, LAS: 0.8948, UEM: 0.6225, LEM: 0.3811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5434, partial_loss/deprel_loss: 0.5990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7762, loss: 0.7667, batch_reg_loss: 0.1883, reg_loss: 0.1881 ||:  37%|###6      | 35/95 [00:25<00:44,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9454, LAS: 0.8954, UEM: 0.6357, LEM: 0.3958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6944, partial_loss/deprel_loss: 0.7790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9504, loss: 0.7592, batch_reg_loss: 0.1883, reg_loss: 0.1881 ||:  40%|####      | 38/95 [00:27<00:42,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9443, LAS: 0.8940, UEM: 0.6177, LEM: 0.3797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4132, partial_loss/deprel_loss: 0.4802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6552, loss: 0.7663, batch_reg_loss: 0.1884, reg_loss: 0.1881 ||:  44%|####4     | 42/95 [00:30<00:38,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9422, LAS: 0.8914, UEM: 0.5969, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8455, partial_loss/deprel_loss: 0.6861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9064, loss: 0.7889, batch_reg_loss: 0.1884, reg_loss: 0.1882 ||:  48%|####8     | 46/95 [00:32<00:34,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8864, UAS: 0.9425, LAS: 0.8919, UEM: 0.5920, LEM: 0.3586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5160, partial_loss/deprel_loss: 0.7093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8591, loss: 0.7868, batch_reg_loss: 0.1885, reg_loss: 0.1882 ||:  52%|#####1    | 49/95 [00:34<00:31,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8074, UAS: 0.9416, LAS: 0.8908, UEM: 0.5890, LEM: 0.3524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6451, partial_loss/deprel_loss: 1.1061, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4024, loss: 0.7942, batch_reg_loss: 0.1885, reg_loss: 0.1882 ||:  55%|#####4    | 52/95 [00:36<00:30,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9404, LAS: 0.8894, UEM: 0.5855, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3017, partial_loss/deprel_loss: 0.4170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5825, loss: 0.8047, batch_reg_loss: 0.1886, reg_loss: 0.1882 ||:  58%|#####7    | 55/95 [00:39<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9407, LAS: 0.8896, UEM: 0.5849, LEM: 0.3473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2642, partial_loss/deprel_loss: 0.4808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6261, loss: 0.8032, batch_reg_loss: 0.1886, reg_loss: 0.1882 ||:  61%|######1   | 58/95 [00:41<00:28,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9413, LAS: 0.8899, UEM: 0.5889, LEM: 0.3473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2398, partial_loss/deprel_loss: 0.4865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6258, loss: 0.7995, batch_reg_loss: 0.1887, reg_loss: 0.1883 ||:  64%|######4   | 61/95 [00:43<00:25,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8982, UAS: 0.9420, LAS: 0.8905, UEM: 0.5975, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4616, partial_loss/deprel_loss: 0.6036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7639, loss: 0.7946, batch_reg_loss: 0.1887, reg_loss: 0.1883 ||:  68%|######8   | 65/95 [00:46<00:21,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9431, LAS: 0.8917, UEM: 0.6147, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5303, partial_loss/deprel_loss: 0.6276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7969, loss: 0.7829, batch_reg_loss: 0.1888, reg_loss: 0.1883 ||:  73%|#######2  | 69/95 [00:48<00:16,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9418, LAS: 0.8903, UEM: 0.6083, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9466, partial_loss/deprel_loss: 0.7993, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0175, loss: 0.7934, batch_reg_loss: 0.1888, reg_loss: 0.1883 ||:  78%|#######7  | 74/95 [00:50<00:12,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9411, LAS: 0.8898, UEM: 0.5973, LEM: 0.3560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0785, partial_loss/deprel_loss: 0.8666, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0979, loss: 0.7982, batch_reg_loss: 0.1889, reg_loss: 0.1884 ||:  83%|########3 | 79/95 [00:52<00:08,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9412, LAS: 0.8899, UEM: 0.5901, LEM: 0.3479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5880, partial_loss/deprel_loss: 0.5951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7826, loss: 0.7978, batch_reg_loss: 0.1889, reg_loss: 0.1884 ||:  87%|########7 | 83/95 [00:57<00:08,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8699, UAS: 0.9408, LAS: 0.8894, UEM: 0.5842, LEM: 0.3418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7730, partial_loss/deprel_loss: 0.7625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9536, loss: 0.8019, batch_reg_loss: 0.1890, reg_loss: 0.1884 ||:  92%|#########1| 87/95 [01:00<00:05,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8416, UAS: 0.9403, LAS: 0.8888, UEM: 0.5809, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3301, partial_loss/deprel_loss: 0.8968, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1725, loss: 0.8064, batch_reg_loss: 0.1890, reg_loss: 0.1884 ||:  96%|#########5| 91/95 [01:02<00:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9402, LAS: 0.8888, UEM: 0.5777, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8507, partial_loss/deprel_loss: 0.8098, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0071, loss: 0.8068, batch_reg_loss: 0.1891, reg_loss: 0.1885 ||: 100%|##########| 95/95 [01:05<00:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9402, LAS: 0.8888, UEM: 0.5777, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8507, partial_loss/deprel_loss: 0.8098, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0071, loss: 0.8068, batch_reg_loss: 0.1891, reg_loss: 0.1885 ||: 100%|##########| 95/95 [01:05<00:00,  1.45it/s]\n",
+      "2023-04-07 00:20:19,918 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9691, LAS: 0.9273, UEM: 0.8205, LEM: 0.5921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1826, partial_loss/deprel_loss: 17.6571, partial_loss/cycle_loss: 0.0000, batch_loss: 14.1622, loss: 18.2288, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:06,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8371, UAS: 0.9466, LAS: 0.8977, UEM: 0.7012, LEM: 0.4608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5806, partial_loss/deprel_loss: 53.6078, partial_loss/cycle_loss: 0.0000, batch_loss: 43.2024, loss: 23.0699, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  55%|#####4    | 6/11 [00:05<00:04,  1.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9507, LAS: 0.9004, UEM: 0.7089, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8707, partial_loss/deprel_loss: 32.8457, partial_loss/cycle_loss: 0.0000, batch_loss: 26.4507, loss: 22.7814, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  82%|########1 | 9/11 [00:08<00:01,  1.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9472, LAS: 0.8956, UEM: 0.6708, LEM: 0.4033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0470, partial_loss/deprel_loss: 41.2218, partial_loss/cycle_loss: 0.0000, batch_loss: 33.1868, loss: 25.0364, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.06it/s]\n",
+      "2023-04-07 00:20:30,262 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.188  |     0.000\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - UEM                      |     0.578  |     0.671\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - LEM                      |     0.337  |     0.403\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - EM                       |     0.863  |     0.871\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.851  |     1.047\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - UAS                      |     0.940  |     0.947\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.810  |    41.222\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - loss                     |     0.807  |    25.036\n",
+      "2023-04-07 00:20:30,263 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - LAS                      |     0.889  |     0.896\n",
+      "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:20:30,264 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:20:30,265 - INFO - combo.training.trainer - Epoch duration: 0:01:15.840607\n",
+      "2023-04-07 00:20:30,265 - INFO - combo.training.trainer - Estimated training time remaining: 5:57:59\n",
+      "2023-04-07 00:20:30,265 - INFO - allennlp.training.trainer - Epoch 81/399\n",
+      "2023-04-07 00:20:30,265 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:20:30,265 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:20:30,272 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8982, UAS: 0.9532, LAS: 0.9055, UEM: 0.5120, LEM: 0.2201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4113, partial_loss/deprel_loss: 0.5896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7431, loss: 0.6814, batch_reg_loss: 0.1891, reg_loss: 0.1891 ||:   4%|4         | 4/95 [00:02<00:58,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9465, LAS: 0.8960, UEM: 0.4424, LEM: 0.1781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5934, partial_loss/deprel_loss: 0.6396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8196, loss: 0.7523, batch_reg_loss: 0.1892, reg_loss: 0.1891 ||:   8%|8         | 8/95 [00:05<00:55,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9517, LAS: 0.9022, UEM: 0.5925, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1377, partial_loss/deprel_loss: 0.3225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4748, loss: 0.7044, batch_reg_loss: 0.1892, reg_loss: 0.1892 ||:  12%|#1        | 11/95 [00:07<01:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9473, LAS: 0.8976, UEM: 0.5870, LEM: 0.3251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3146, partial_loss/deprel_loss: 0.4169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5857, loss: 0.7374, batch_reg_loss: 0.1893, reg_loss: 0.1892 ||:  15%|#4        | 14/95 [00:09<00:57,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9491, LAS: 0.8992, UEM: 0.5768, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3695, partial_loss/deprel_loss: 0.5371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6929, loss: 0.7260, batch_reg_loss: 0.1893, reg_loss: 0.1892 ||:  19%|#8        | 18/95 [00:12<00:52,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9461, LAS: 0.8960, UEM: 0.5606, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3091, partial_loss/deprel_loss: 0.4978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6495, loss: 0.7472, batch_reg_loss: 0.1894, reg_loss: 0.1892 ||:  23%|##3       | 22/95 [00:14<00:48,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9437, LAS: 0.8932, UEM: 0.5314, LEM: 0.2714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1287, partial_loss/deprel_loss: 0.9095, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1428, loss: 0.7699, batch_reg_loss: 0.1894, reg_loss: 0.1893 ||:  27%|##7       | 26/95 [00:17<00:46,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8202, UAS: 0.9407, LAS: 0.8901, UEM: 0.5317, LEM: 0.2779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6746, partial_loss/deprel_loss: 1.0439, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3595, loss: 0.7930, batch_reg_loss: 0.1894, reg_loss: 0.1893 ||:  31%|###       | 29/95 [00:19<00:46,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9421, LAS: 0.8916, UEM: 0.5485, LEM: 0.2887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.4476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6021, loss: 0.7818, batch_reg_loss: 0.1895, reg_loss: 0.1893 ||:  34%|###3      | 32/95 [00:22<00:45,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9428, LAS: 0.8925, UEM: 0.5586, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2292, partial_loss/deprel_loss: 0.4444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5909, loss: 0.7759, batch_reg_loss: 0.1895, reg_loss: 0.1893 ||:  37%|###6      | 35/95 [00:24<00:44,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9435, LAS: 0.8932, UEM: 0.5609, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2145, partial_loss/deprel_loss: 0.4473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5903, loss: 0.7733, batch_reg_loss: 0.1896, reg_loss: 0.1893 ||:  41%|####1     | 39/95 [00:27<00:39,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9444, LAS: 0.8943, UEM: 0.5979, LEM: 0.3504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2540, partial_loss/deprel_loss: 0.4483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5990, loss: 0.7647, batch_reg_loss: 0.1896, reg_loss: 0.1894 ||:  44%|####4     | 42/95 [00:29<00:40,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9431, LAS: 0.8931, UEM: 0.6082, LEM: 0.3675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4032, partial_loss/deprel_loss: 0.9042, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1936, loss: 0.7752, batch_reg_loss: 0.1897, reg_loss: 0.1894 ||:  47%|####7     | 45/95 [00:31<00:37,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9439, LAS: 0.8941, UEM: 0.6117, LEM: 0.3679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4422, partial_loss/deprel_loss: 0.5357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7067, loss: 0.7698, batch_reg_loss: 0.1897, reg_loss: 0.1894 ||:  51%|#####     | 48/95 [00:34<00:36,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9430, LAS: 0.8932, UEM: 0.6004, LEM: 0.3586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6614, partial_loss/deprel_loss: 0.6990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8812, loss: 0.7761, batch_reg_loss: 0.1897, reg_loss: 0.1894 ||:  54%|#####3    | 51/95 [00:36<00:33,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8883, UAS: 0.9410, LAS: 0.8910, UEM: 0.5863, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6204, partial_loss/deprel_loss: 0.6619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8434, loss: 0.7930, batch_reg_loss: 0.1898, reg_loss: 0.1894 ||:  58%|#####7    | 55/95 [00:39<00:29,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9415, LAS: 0.8917, UEM: 0.5858, LEM: 0.3449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2670, partial_loss/deprel_loss: 0.4122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5730, loss: 0.7890, batch_reg_loss: 0.1898, reg_loss: 0.1895 ||:  62%|######2   | 59/95 [00:41<00:25,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9417, LAS: 0.8917, UEM: 0.5870, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2479, partial_loss/deprel_loss: 0.3969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5570, loss: 0.7890, batch_reg_loss: 0.1899, reg_loss: 0.1895 ||:  65%|######5   | 62/95 [00:44<00:23,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9418, LAS: 0.8917, UEM: 0.5857, LEM: 0.3411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7133, partial_loss/deprel_loss: 0.6690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8678, loss: 0.7870, batch_reg_loss: 0.1899, reg_loss: 0.1895 ||:  68%|######8   | 65/95 [00:46<00:21,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8292, UAS: 0.9408, LAS: 0.8906, UEM: 0.5769, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4467, partial_loss/deprel_loss: 1.0592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3266, loss: 0.7982, batch_reg_loss: 0.1900, reg_loss: 0.1895 ||:  72%|#######1  | 68/95 [00:48<00:18,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9413, LAS: 0.8911, UEM: 0.5811, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1525, partial_loss/deprel_loss: 0.3706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5170, loss: 0.7954, batch_reg_loss: 0.1900, reg_loss: 0.1896 ||:  76%|#######5  | 72/95 [00:50<00:15,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9413, LAS: 0.8908, UEM: 0.5743, LEM: 0.3309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4549, partial_loss/deprel_loss: 0.5787, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7440, loss: 0.7975, batch_reg_loss: 0.1901, reg_loss: 0.1896 ||:  80%|########  | 76/95 [00:53<00:12,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8542, UAS: 0.9407, LAS: 0.8899, UEM: 0.5642, LEM: 0.3228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0134, partial_loss/deprel_loss: 0.7880, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0232, loss: 0.8038, batch_reg_loss: 0.1901, reg_loss: 0.1896 ||:  84%|########4 | 80/95 [00:55<00:09,  1.61it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9418, LAS: 0.8909, UEM: 0.5782, LEM: 0.3335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5291, partial_loss/deprel_loss: 0.6351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8040, loss: 0.7943, batch_reg_loss: 0.1902, reg_loss: 0.1896 ||:  89%|########9 | 85/95 [00:57<00:05,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9418, LAS: 0.8910, UEM: 0.5920, LEM: 0.3441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.3127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4742, loss: 0.7921, batch_reg_loss: 0.1902, reg_loss: 0.1897 ||:  95%|#########4| 90/95 [01:00<00:02,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9413, LAS: 0.8902, UEM: 0.5830, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4300, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7662, loss: 0.7992, batch_reg_loss: 0.1903, reg_loss: 0.1897 ||: 100%|##########| 95/95 [01:02<00:00,  1.85it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9413, LAS: 0.8902, UEM: 0.5830, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4300, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7662, loss: 0.7992, batch_reg_loss: 0.1903, reg_loss: 0.1897 ||: 100%|##########| 95/95 [01:02<00:00,  1.51it/s]\n",
+      "2023-04-07 00:21:33,036 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.190  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - UEM                      |     0.583  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - LEM                      |     0.335  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - EM                       |     0.897  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.430  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.612  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - loss                     |     0.799  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:21:33,037 - INFO - combo.training.tensorboard_writer - LAS                      |     0.890  |       N/A\n",
+      "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:21:33,038 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:21:33,038 - INFO - combo.training.trainer - Epoch duration: 0:01:02.773691\n",
+      "2023-04-07 00:21:33,039 - INFO - combo.training.trainer - Estimated training time remaining: 5:56:34\n",
+      "2023-04-07 00:21:33,039 - INFO - allennlp.training.trainer - Epoch 82/399\n",
+      "2023-04-07 00:21:33,039 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:21:33,039 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:21:33,046 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9454, LAS: 0.8927, UEM: 0.4833, LEM: 0.2201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4030, partial_loss/deprel_loss: 0.5688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7260, loss: 0.7748, batch_reg_loss: 0.1903, reg_loss: 0.1903 ||:   4%|4         | 4/95 [00:02<00:58,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9485, LAS: 0.8984, UEM: 0.5650, LEM: 0.3109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5287, partial_loss/deprel_loss: 0.5602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7443, loss: 0.7361, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||:   8%|8         | 8/95 [00:05<00:55,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9496, LAS: 0.8982, UEM: 0.5911, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7146, partial_loss/deprel_loss: 0.7561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9382, loss: 0.7368, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||:  12%|#1        | 11/95 [00:07<00:54,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9496, LAS: 0.8991, UEM: 0.5772, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3317, partial_loss/deprel_loss: 0.5018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6583, loss: 0.7337, batch_reg_loss: 0.1905, reg_loss: 0.1904 ||:  16%|#5        | 15/95 [00:09<00:51,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7966, UAS: 0.9427, LAS: 0.8916, UEM: 0.5607, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9665, partial_loss/deprel_loss: 1.0984, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4625, loss: 0.7855, batch_reg_loss: 0.1905, reg_loss: 0.1904 ||:  19%|#8        | 18/95 [00:12<00:53,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9454, LAS: 0.8947, UEM: 0.5856, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2318, partial_loss/deprel_loss: 0.4047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5607, loss: 0.7637, batch_reg_loss: 0.1906, reg_loss: 0.1904 ||:  22%|##2       | 21/95 [00:14<00:53,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9450, LAS: 0.8941, UEM: 0.5764, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2536, partial_loss/deprel_loss: 0.4636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6122, loss: 0.7734, batch_reg_loss: 0.1906, reg_loss: 0.1905 ||:  26%|##6       | 25/95 [00:16<00:47,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9443, LAS: 0.8936, UEM: 0.5872, LEM: 0.3180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2336, partial_loss/deprel_loss: 0.3758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5380, loss: 0.7777, batch_reg_loss: 0.1907, reg_loss: 0.1905 ||:  29%|##9       | 28/95 [00:19<00:48,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9446, LAS: 0.8944, UEM: 0.6237, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1304, partial_loss/deprel_loss: 0.2652, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4289, loss: 0.7715, batch_reg_loss: 0.1907, reg_loss: 0.1905 ||:  33%|###2      | 31/95 [00:21<00:47,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9454, LAS: 0.8951, UEM: 0.6163, LEM: 0.3588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6524, partial_loss/deprel_loss: 0.6512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8422, loss: 0.7654, batch_reg_loss: 0.1907, reg_loss: 0.1905 ||:  37%|###6      | 35/95 [00:24<00:42,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9465, LAS: 0.8960, UEM: 0.6211, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2832, partial_loss/deprel_loss: 0.4528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6097, loss: 0.7576, batch_reg_loss: 0.1908, reg_loss: 0.1905 ||:  40%|####      | 38/95 [00:26<00:40,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8478, UAS: 0.9463, LAS: 0.8960, UEM: 0.6213, LEM: 0.3611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1968, partial_loss/deprel_loss: 0.8406, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1027, loss: 0.7585, batch_reg_loss: 0.1908, reg_loss: 0.1906 ||:  43%|####3     | 41/95 [00:28<00:37,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9473, LAS: 0.8972, UEM: 0.6317, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2926, partial_loss/deprel_loss: 0.4871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6391, loss: 0.7465, batch_reg_loss: 0.1908, reg_loss: 0.1906 ||:  46%|####6     | 44/95 [00:31<00:39,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9456, LAS: 0.8952, UEM: 0.6137, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5593, partial_loss/deprel_loss: 0.5878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7730, loss: 0.7609, batch_reg_loss: 0.1909, reg_loss: 0.1906 ||:  51%|#####     | 48/95 [00:33<00:34,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8404, UAS: 0.9454, LAS: 0.8951, UEM: 0.6163, LEM: 0.3577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2513, partial_loss/deprel_loss: 0.9229, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1795, loss: 0.7621, batch_reg_loss: 0.1909, reg_loss: 0.1906 ||:  55%|#####4    | 52/95 [00:36<00:29,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9464, LAS: 0.8965, UEM: 0.6368, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4366, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7466, loss: 0.7526, batch_reg_loss: 0.1910, reg_loss: 0.1906 ||:  58%|#####7    | 55/95 [00:38<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9463, LAS: 0.8961, UEM: 0.6380, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7707, partial_loss/deprel_loss: 0.7863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9742, loss: 0.7552, batch_reg_loss: 0.1910, reg_loss: 0.1907 ||:  61%|######1   | 58/95 [00:40<00:26,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9463, LAS: 0.8962, UEM: 0.6314, LEM: 0.3879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8695, partial_loss/deprel_loss: 0.7489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9641, loss: 0.7544, batch_reg_loss: 0.1910, reg_loss: 0.1907 ||:  65%|######5   | 62/95 [00:42<00:22,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9459, LAS: 0.8956, UEM: 0.6232, LEM: 0.3803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4445, partial_loss/deprel_loss: 0.5806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7444, loss: 0.7598, batch_reg_loss: 0.1911, reg_loss: 0.1907 ||:  68%|######8   | 65/95 [00:45<00:21,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9439, LAS: 0.8935, UEM: 0.6157, LEM: 0.3744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4739, partial_loss/deprel_loss: 0.5676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7400, loss: 0.7744, batch_reg_loss: 0.1911, reg_loss: 0.1907 ||:  72%|#######1  | 68/95 [00:47<00:19,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8383, UAS: 0.9430, LAS: 0.8924, UEM: 0.6092, LEM: 0.3684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3128, partial_loss/deprel_loss: 0.9474, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2116, loss: 0.7842, batch_reg_loss: 0.1911, reg_loss: 0.1907 ||:  75%|#######4  | 71/95 [00:49<00:17,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9436, LAS: 0.8929, UEM: 0.6133, LEM: 0.3722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4393, partial_loss/deprel_loss: 0.5510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7199, loss: 0.7798, batch_reg_loss: 0.1912, reg_loss: 0.1908 ||:  78%|#######7  | 74/95 [00:52<00:15,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9429, LAS: 0.8922, UEM: 0.6096, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2051, partial_loss/deprel_loss: 0.3906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5448, loss: 0.7844, batch_reg_loss: 0.1913, reg_loss: 0.1908 ||:  82%|########2 | 78/95 [00:54<00:11,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9426, LAS: 0.8916, UEM: 0.6021, LEM: 0.3612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3763, partial_loss/deprel_loss: 0.4861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6555, loss: 0.7880, batch_reg_loss: 0.1913, reg_loss: 0.1908 ||:  86%|########6 | 82/95 [00:57<00:08,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8583, UAS: 0.9417, LAS: 0.8905, UEM: 0.5911, LEM: 0.3528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8662, partial_loss/deprel_loss: 0.7807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9892, loss: 0.7954, batch_reg_loss: 0.1914, reg_loss: 0.1908 ||:  91%|######### | 86/95 [00:59<00:06,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9417, LAS: 0.8904, UEM: 0.5910, LEM: 0.3524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2937, partial_loss/deprel_loss: 0.5050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6542, loss: 0.7962, batch_reg_loss: 0.1914, reg_loss: 0.1909 ||:  94%|#########3| 89/95 [01:02<00:04,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9420, LAS: 0.8908, UEM: 0.5895, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4636, partial_loss/deprel_loss: 0.5941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7595, loss: 0.7946, batch_reg_loss: 0.1915, reg_loss: 0.1909 ||:  98%|#########7| 93/95 [01:05<00:01,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8331, UAS: 0.9412, LAS: 0.8899, UEM: 0.5850, LEM: 0.3465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3715, partial_loss/deprel_loss: 1.0574, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3117, loss: 0.8027, batch_reg_loss: 0.1915, reg_loss: 0.1909 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.191  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - UEM                      |     0.585  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - LEM                      |     0.347  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - EM                       |     0.833  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.372  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.057  |       N/A\n",
+      "2023-04-07 00:22:39,475 - INFO - combo.training.tensorboard_writer - loss                     |     0.803  |       N/A\n",
+      "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - LAS                      |     0.890  |       N/A\n",
+      "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:22:39,476 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:22:39,477 - INFO - combo.training.trainer - Epoch duration: 0:01:06.437919\n",
+      "2023-04-07 00:22:39,477 - INFO - combo.training.trainer - Estimated training time remaining: 5:55:24\n",
+      "2023-04-07 00:22:39,477 - INFO - allennlp.training.trainer - Epoch 83/399\n",
+      "2023-04-07 00:22:39,477 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:22:39,477 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:22:39,484 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9375, LAS: 0.8905, UEM: 0.5267, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2462, partial_loss/deprel_loss: 0.3812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5457, loss: 0.7993, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||:   3%|3         | 3/95 [00:02<01:11,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8182, UAS: 0.9347, LAS: 0.8856, UEM: 0.5202, LEM: 0.2607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6103, partial_loss/deprel_loss: 0.9962, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3106, loss: 0.8429, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||:   6%|6         | 6/95 [00:04<01:06,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8114, UAS: 0.9304, LAS: 0.8810, UEM: 0.5515, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6095, partial_loss/deprel_loss: 1.1064, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3986, loss: 0.8810, batch_reg_loss: 0.1917, reg_loss: 0.1916 ||:   9%|9         | 9/95 [00:06<01:04,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9339, LAS: 0.8839, UEM: 0.5453, LEM: 0.3012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9913, partial_loss/deprel_loss: 0.7666, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0033, loss: 0.8616, batch_reg_loss: 0.1917, reg_loss: 0.1916 ||:  13%|#2        | 12/95 [00:08<01:01,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8309, UAS: 0.9338, LAS: 0.8836, UEM: 0.5344, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3335, partial_loss/deprel_loss: 0.9585, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2253, loss: 0.8581, batch_reg_loss: 0.1918, reg_loss: 0.1917 ||:  18%|#7        | 17/95 [00:11<00:51,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9382, LAS: 0.8884, UEM: 0.5477, LEM: 0.2879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2545, partial_loss/deprel_loss: 0.4284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5855, loss: 0.8215, batch_reg_loss: 0.1919, reg_loss: 0.1917 ||:  23%|##3       | 22/95 [00:13<00:43,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8598, UAS: 0.9377, LAS: 0.8880, UEM: 0.5889, LEM: 0.3612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9696, partial_loss/deprel_loss: 0.8608, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0744, loss: 0.8261, batch_reg_loss: 0.1919, reg_loss: 0.1917 ||:  27%|##7       | 26/95 [00:15<00:39,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9411, LAS: 0.8912, UEM: 0.6167, LEM: 0.3742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2082, partial_loss/deprel_loss: 0.4205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5700, loss: 0.7990, batch_reg_loss: 0.1920, reg_loss: 0.1918 ||:  32%|###1      | 30/95 [00:17<00:37,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9389, LAS: 0.8886, UEM: 0.5864, LEM: 0.3509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8068, partial_loss/deprel_loss: 0.6758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8940, loss: 0.8122, batch_reg_loss: 0.1920, reg_loss: 0.1918 ||:  36%|###5      | 34/95 [00:20<00:36,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8687, UAS: 0.9380, LAS: 0.8880, UEM: 0.5727, LEM: 0.3414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9398, partial_loss/deprel_loss: 0.7578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9862, loss: 0.8187, batch_reg_loss: 0.1920, reg_loss: 0.1918 ||:  40%|####      | 38/95 [00:22<00:34,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9399, LAS: 0.8897, UEM: 0.5863, LEM: 0.3450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3260, partial_loss/deprel_loss: 0.5214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6744, loss: 0.8047, batch_reg_loss: 0.1921, reg_loss: 0.1918 ||:  44%|####4     | 42/95 [00:25<00:34,  1.55it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9413, LAS: 0.8914, UEM: 0.5879, LEM: 0.3408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6506, partial_loss/deprel_loss: 0.6128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8125, loss: 0.7936, batch_reg_loss: 0.1921, reg_loss: 0.1919 ||:  48%|####8     | 46/95 [00:28<00:31,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9409, LAS: 0.8906, UEM: 0.5728, LEM: 0.3271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8299, partial_loss/deprel_loss: 0.7765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9793, loss: 0.7979, batch_reg_loss: 0.1922, reg_loss: 0.1919 ||:  53%|#####2    | 50/95 [00:30<00:27,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9421, LAS: 0.8921, UEM: 0.5738, LEM: 0.3254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3728, partial_loss/deprel_loss: 0.5539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7100, loss: 0.7881, batch_reg_loss: 0.1922, reg_loss: 0.1919 ||:  57%|#####6    | 54/95 [00:32<00:24,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9232, UAS: 0.9421, LAS: 0.8923, UEM: 0.5675, LEM: 0.3222, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3272, partial_loss/deprel_loss: 0.3356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5262, loss: 0.7879, batch_reg_loss: 0.1923, reg_loss: 0.1919 ||:  61%|######1   | 58/95 [00:35<00:23,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8335, UAS: 0.9409, LAS: 0.8907, UEM: 0.5630, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3436, partial_loss/deprel_loss: 0.9344, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2085, loss: 0.7989, batch_reg_loss: 0.1923, reg_loss: 0.1920 ||:  65%|######5   | 62/95 [00:38<00:21,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9404, LAS: 0.8903, UEM: 0.5566, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4736, partial_loss/deprel_loss: 0.5961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7640, loss: 0.8042, batch_reg_loss: 0.1924, reg_loss: 0.1920 ||:  69%|######9   | 66/95 [00:41<00:19,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9413, LAS: 0.8911, UEM: 0.5739, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4320, partial_loss/deprel_loss: 0.6516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8001, loss: 0.7970, batch_reg_loss: 0.1924, reg_loss: 0.1920 ||:  74%|#######3  | 70/95 [00:44<00:17,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8607, UAS: 0.9412, LAS: 0.8909, UEM: 0.5722, LEM: 0.3291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7803, partial_loss/deprel_loss: 0.8010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9893, loss: 0.7986, batch_reg_loss: 0.1925, reg_loss: 0.1920 ||:  77%|#######6  | 73/95 [00:46<00:15,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9411, LAS: 0.8906, UEM: 0.5774, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1304, partial_loss/deprel_loss: 0.3262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4795, loss: 0.8013, batch_reg_loss: 0.1925, reg_loss: 0.1920 ||:  80%|########  | 76/95 [00:48<00:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9402, LAS: 0.8895, UEM: 0.5729, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5167, partial_loss/deprel_loss: 0.5689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7510, loss: 0.8102, batch_reg_loss: 0.1926, reg_loss: 0.1921 ||:  84%|########4 | 80/95 [00:50<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9414, LAS: 0.8909, UEM: 0.5957, LEM: 0.3528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.3822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5420, loss: 0.7994, batch_reg_loss: 0.1926, reg_loss: 0.1921 ||:  87%|########7 | 83/95 [00:53<00:08,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8377, UAS: 0.9407, LAS: 0.8902, UEM: 0.5896, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2760, partial_loss/deprel_loss: 0.9142, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1792, loss: 0.8046, batch_reg_loss: 0.1927, reg_loss: 0.1921 ||:  92%|#########1| 87/95 [00:55<00:05,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9407, LAS: 0.8903, UEM: 0.5877, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2826, partial_loss/deprel_loss: 0.3763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5503, loss: 0.8036, batch_reg_loss: 0.1927, reg_loss: 0.1921 ||:  95%|#########4| 90/95 [00:58<00:03,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9409, LAS: 0.8905, UEM: 0.5866, LEM: 0.3455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2854, partial_loss/deprel_loss: 0.4692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6252, loss: 0.8015, batch_reg_loss: 0.1928, reg_loss: 0.1922 ||:  98%|#########7| 93/95 [01:00<00:01,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8843, UAS: 0.9408, LAS: 0.8904, UEM: 0.5829, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5981, partial_loss/deprel_loss: 0.6764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8536, loss: 0.8021, batch_reg_loss: 0.1928, reg_loss: 0.1922 ||: 100%|##########| 95/95 [01:01<00:00,  1.55it/s]\n",
+      "2023-04-07 00:23:40,869 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.192  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - UEM                      |     0.583  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - LEM                      |     0.342  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - EM                       |     0.884  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.598  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.676  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - loss                     |     0.802  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - LAS                      |     0.890  |       N/A\n",
+      "2023-04-07 00:23:40,870 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:23:40,871 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:23:40,871 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:23:40,871 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:23:40,871 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:23:40,871 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:23:40,871 - INFO - combo.training.trainer - Epoch duration: 0:01:01.394685\n",
+      "2023-04-07 00:23:40,872 - INFO - combo.training.trainer - Estimated training time remaining: 5:53:54\n",
+      "2023-04-07 00:23:40,872 - INFO - allennlp.training.trainer - Epoch 84/399\n",
+      "2023-04-07 00:23:40,872 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:23:40,872 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:23:40,879 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9451, LAS: 0.8962, UEM: 0.5269, LEM: 0.2642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4271, partial_loss/deprel_loss: 0.4962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6752, loss: 0.7608, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||:   4%|4         | 4/95 [00:02<01:03,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9516, LAS: 0.9027, UEM: 0.6270, LEM: 0.3490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1486, partial_loss/deprel_loss: 0.3714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5197, loss: 0.7151, batch_reg_loss: 0.1929, reg_loss: 0.1928 ||:   7%|7         | 7/95 [00:05<01:04,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8572, UAS: 0.9464, LAS: 0.8968, UEM: 0.5877, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0149, partial_loss/deprel_loss: 0.8171, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0496, loss: 0.7587, batch_reg_loss: 0.1929, reg_loss: 0.1929 ||:  11%|#         | 10/95 [00:07<01:01,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9475, LAS: 0.8987, UEM: 0.5835, LEM: 0.3159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5914, partial_loss/deprel_loss: 0.6744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8507, loss: 0.7560, batch_reg_loss: 0.1929, reg_loss: 0.1929 ||:  14%|#3        | 13/95 [00:09<00:58,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9491, LAS: 0.9002, UEM: 0.5839, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2165, partial_loss/deprel_loss: 0.4450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5922, loss: 0.7433, batch_reg_loss: 0.1930, reg_loss: 0.1929 ||:  17%|#6        | 16/95 [00:11<00:57,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8376, UAS: 0.9421, LAS: 0.8933, UEM: 0.5564, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2379, partial_loss/deprel_loss: 0.9064, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1657, loss: 0.7891, batch_reg_loss: 0.1930, reg_loss: 0.1929 ||:  20%|##        | 19/95 [00:13<00:54,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8832, UAS: 0.9423, LAS: 0.8934, UEM: 0.5402, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7128, partial_loss/deprel_loss: 0.6937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8906, loss: 0.7904, batch_reg_loss: 0.1930, reg_loss: 0.1929 ||:  23%|##3       | 22/95 [00:15<00:52,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8484, UAS: 0.9418, LAS: 0.8932, UEM: 0.5599, LEM: 0.2998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2771, partial_loss/deprel_loss: 0.8405, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1209, loss: 0.7862, batch_reg_loss: 0.1931, reg_loss: 0.1929 ||:  26%|##6       | 25/95 [00:18<00:50,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9440, LAS: 0.8952, UEM: 0.5799, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2042, partial_loss/deprel_loss: 0.4251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5741, loss: 0.7691, batch_reg_loss: 0.1931, reg_loss: 0.1930 ||:  29%|##9       | 28/95 [00:20<00:47,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8386, UAS: 0.9391, LAS: 0.8896, UEM: 0.5604, LEM: 0.3028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2063, partial_loss/deprel_loss: 0.8403, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1066, loss: 0.8119, batch_reg_loss: 0.1932, reg_loss: 0.1930 ||:  33%|###2      | 31/95 [00:22<00:44,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9401, LAS: 0.8910, UEM: 0.5682, LEM: 0.3108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4735, partial_loss/deprel_loss: 0.5701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7440, loss: 0.8022, batch_reg_loss: 0.1932, reg_loss: 0.1930 ||:  37%|###6      | 35/95 [00:24<00:40,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9409, LAS: 0.8918, UEM: 0.5754, LEM: 0.3143, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5804, partial_loss/deprel_loss: 0.6790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8525, loss: 0.7963, batch_reg_loss: 0.1933, reg_loss: 0.1930 ||:  41%|####1     | 39/95 [00:27<00:36,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9411, LAS: 0.8918, UEM: 0.5984, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5573, partial_loss/deprel_loss: 0.6468, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8222, loss: 0.7981, batch_reg_loss: 0.1933, reg_loss: 0.1931 ||:  45%|####5     | 43/95 [00:30<00:35,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9422, LAS: 0.8928, UEM: 0.5970, LEM: 0.3487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2616, partial_loss/deprel_loss: 0.4251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5858, loss: 0.7911, batch_reg_loss: 0.1934, reg_loss: 0.1931 ||:  49%|####9     | 47/95 [00:32<00:30,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9429, LAS: 0.8933, UEM: 0.5970, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1733, partial_loss/deprel_loss: 0.3771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5298, loss: 0.7856, batch_reg_loss: 0.1934, reg_loss: 0.1931 ||:  55%|#####4    | 52/95 [00:34<00:25,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9439, LAS: 0.8947, UEM: 0.6059, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5545, partial_loss/deprel_loss: 0.6443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8198, loss: 0.7756, batch_reg_loss: 0.1935, reg_loss: 0.1931 ||:  59%|#####8    | 56/95 [00:37<00:24,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9433, LAS: 0.8941, UEM: 0.6199, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4348, partial_loss/deprel_loss: 0.5503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7207, loss: 0.7750, batch_reg_loss: 0.1935, reg_loss: 0.1932 ||:  63%|######3   | 60/95 [00:40<00:23,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8803, UAS: 0.9426, LAS: 0.8932, UEM: 0.6076, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6869, partial_loss/deprel_loss: 0.7540, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9341, loss: 0.7818, batch_reg_loss: 0.1935, reg_loss: 0.1932 ||:  67%|######7   | 64/95 [00:42<00:19,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9431, LAS: 0.8937, UEM: 0.6083, LEM: 0.3633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2179, partial_loss/deprel_loss: 0.4065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5624, loss: 0.7767, batch_reg_loss: 0.1936, reg_loss: 0.1932 ||:  72%|#######1  | 68/95 [00:44<00:16,  1.64it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9429, LAS: 0.8933, UEM: 0.6004, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6285, partial_loss/deprel_loss: 0.7207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8959, loss: 0.7792, batch_reg_loss: 0.1936, reg_loss: 0.1932 ||:  76%|#######5  | 72/95 [00:47<00:13,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9424, LAS: 0.8927, UEM: 0.5996, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2378, partial_loss/deprel_loss: 0.4595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6088, loss: 0.7833, batch_reg_loss: 0.1937, reg_loss: 0.1933 ||:  81%|########1 | 77/95 [00:49<00:10,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9417, LAS: 0.8918, UEM: 0.5899, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8107, partial_loss/deprel_loss: 0.7399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9478, loss: 0.7908, batch_reg_loss: 0.1938, reg_loss: 0.1933 ||:  86%|########6 | 82/95 [00:51<00:06,  1.92it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9407, LAS: 0.8907, UEM: 0.5812, LEM: 0.3407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9775, partial_loss/deprel_loss: 0.8004, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0296, loss: 0.8001, batch_reg_loss: 0.1938, reg_loss: 0.1933 ||:  91%|######### | 86/95 [00:54<00:05,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9400, LAS: 0.8900, UEM: 0.5715, LEM: 0.3336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4604, partial_loss/deprel_loss: 0.5352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7141, loss: 0.8060, batch_reg_loss: 0.1939, reg_loss: 0.1933 ||:  95%|#########4| 90/95 [00:57<00:03,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9401, LAS: 0.8903, UEM: 0.5700, LEM: 0.3311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3952, partial_loss/deprel_loss: 0.5165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6862, loss: 0.8044, batch_reg_loss: 0.1939, reg_loss: 0.1934 ||:  99%|#########8| 94/95 [01:00<00:00,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9405, LAS: 0.8907, UEM: 0.5782, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1208, partial_loss/deprel_loss: 0.3166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4714, loss: 0.8009, batch_reg_loss: 0.1940, reg_loss: 0.1934 ||: 100%|##########| 95/95 [01:01<00:00,  1.55it/s]\n",
+      "2023-04-07 00:24:42,021 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:24:42,021 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:24:42,021 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.193  |       N/A\n",
+      "2023-04-07 00:24:42,021 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:24:42,021 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - UEM                      |     0.578  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - LEM                      |     0.339  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - EM                       |     0.932  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.121  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - UAS                      |     0.940  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.317  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - loss                     |     0.801  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - LAS                      |     0.891  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:24:42,022 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:24:42,023 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:24:42,023 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:24:42,023 - INFO - combo.training.trainer - Epoch duration: 0:01:01.151488\n",
+      "2023-04-07 00:24:42,023 - INFO - combo.training.trainer - Estimated training time remaining: 5:52:25\n",
+      "2023-04-07 00:24:42,023 - INFO - allennlp.training.trainer - Epoch 85/399\n",
+      "2023-04-07 00:24:42,024 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:24:42,024 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:24:42,030 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9041, UAS: 0.9466, LAS: 0.8997, UEM: 0.4561, LEM: 0.2193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4473, partial_loss/deprel_loss: 0.5097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6912, loss: 0.7181, batch_reg_loss: 0.1940, reg_loss: 0.1940 ||:   3%|3         | 3/95 [00:02<01:01,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9368, LAS: 0.8882, UEM: 0.3619, LEM: 0.1613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6710, partial_loss/deprel_loss: 0.7099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8962, loss: 0.8291, batch_reg_loss: 0.1941, reg_loss: 0.1940 ||:   7%|7         | 7/95 [00:04<00:56,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9316, LAS: 0.8808, UEM: 0.3174, LEM: 0.1327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6454, partial_loss/deprel_loss: 0.6888, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8743, loss: 0.8748, batch_reg_loss: 0.1941, reg_loss: 0.1940 ||:  11%|#         | 10/95 [00:06<00:55,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9397, LAS: 0.8890, UEM: 0.4730, LEM: 0.2343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2931, partial_loss/deprel_loss: 0.4276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5948, loss: 0.8079, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||:  14%|#3        | 13/95 [00:08<00:54,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9064, UAS: 0.9408, LAS: 0.8907, UEM: 0.4914, LEM: 0.2435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3559, partial_loss/deprel_loss: 0.5021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6671, loss: 0.7967, batch_reg_loss: 0.1942, reg_loss: 0.1941 ||:  18%|#7        | 17/95 [00:10<00:49,  1.57it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9401, LAS: 0.8899, UEM: 0.4798, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4468, partial_loss/deprel_loss: 0.4423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6375, loss: 0.8073, batch_reg_loss: 0.1943, reg_loss: 0.1941 ||:  22%|##2       | 21/95 [00:13<00:46,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9404, LAS: 0.8903, UEM: 0.5016, LEM: 0.2535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2345, partial_loss/deprel_loss: 0.8768, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1426, loss: 0.8032, batch_reg_loss: 0.1943, reg_loss: 0.1941 ||:  25%|##5       | 24/95 [00:15<00:47,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9419, LAS: 0.8923, UEM: 0.5276, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3129, partial_loss/deprel_loss: 0.4355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6053, loss: 0.7858, batch_reg_loss: 0.1943, reg_loss: 0.1942 ||:  28%|##8       | 27/95 [00:17<00:48,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9422, LAS: 0.8923, UEM: 0.5250, LEM: 0.2755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7323, partial_loss/deprel_loss: 0.6823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8867, loss: 0.7885, batch_reg_loss: 0.1944, reg_loss: 0.1942 ||:  33%|###2      | 31/95 [00:20<00:44,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9423, LAS: 0.8925, UEM: 0.5366, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2038, partial_loss/deprel_loss: 0.3853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.7862, batch_reg_loss: 0.1944, reg_loss: 0.1942 ||:  36%|###5      | 34/95 [00:22<00:43,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9410, LAS: 0.8913, UEM: 0.5240, LEM: 0.2777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4180, partial_loss/deprel_loss: 0.5033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6807, loss: 0.7934, batch_reg_loss: 0.1944, reg_loss: 0.1942 ||:  39%|###8      | 37/95 [00:25<00:42,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9421, LAS: 0.8924, UEM: 0.5291, LEM: 0.2791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2863, partial_loss/deprel_loss: 0.4049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5757, loss: 0.7884, batch_reg_loss: 0.1945, reg_loss: 0.1942 ||:  43%|####3     | 41/95 [00:27<00:38,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9432, LAS: 0.8933, UEM: 0.5458, LEM: 0.2925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5333, partial_loss/deprel_loss: 0.6796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8448, loss: 0.7791, batch_reg_loss: 0.1945, reg_loss: 0.1943 ||:  46%|####6     | 44/95 [00:29<00:36,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9064, UAS: 0.9433, LAS: 0.8932, UEM: 0.5358, LEM: 0.2840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4555, partial_loss/deprel_loss: 0.5005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6861, loss: 0.7829, batch_reg_loss: 0.1945, reg_loss: 0.1943 ||:  51%|#####     | 48/95 [00:32<00:32,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9437, LAS: 0.8938, UEM: 0.5471, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4086, partial_loss/deprel_loss: 0.5916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7496, loss: 0.7790, batch_reg_loss: 0.1946, reg_loss: 0.1943 ||:  54%|#####3    | 51/95 [00:34<00:30,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9588, UAS: 0.9440, LAS: 0.8945, UEM: 0.5814, LEM: 0.3416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0533, partial_loss/deprel_loss: 0.1731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3438, loss: 0.7741, batch_reg_loss: 0.1946, reg_loss: 0.1943 ||:  57%|#####6    | 54/95 [00:37<00:30,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9442, LAS: 0.8947, UEM: 0.5798, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3199, partial_loss/deprel_loss: 0.5124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6686, loss: 0.7741, batch_reg_loss: 0.1947, reg_loss: 0.1943 ||:  61%|######1   | 58/95 [00:39<00:26,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8674, UAS: 0.9429, LAS: 0.8935, UEM: 0.5735, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8163, partial_loss/deprel_loss: 0.7422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9517, loss: 0.7821, batch_reg_loss: 0.1947, reg_loss: 0.1944 ||:  64%|######4   | 61/95 [00:41<00:23,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9431, LAS: 0.8936, UEM: 0.5759, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3294, partial_loss/deprel_loss: 0.5370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6902, loss: 0.7815, batch_reg_loss: 0.1947, reg_loss: 0.1944 ||:  67%|######7   | 64/95 [00:43<00:22,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9436, LAS: 0.8942, UEM: 0.5927, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1745, partial_loss/deprel_loss: 0.3375, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4997, loss: 0.7782, batch_reg_loss: 0.1948, reg_loss: 0.1944 ||:  71%|#######   | 67/95 [00:46<00:20,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9436, LAS: 0.8938, UEM: 0.5873, LEM: 0.3443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5926, partial_loss/deprel_loss: 0.6632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8439, loss: 0.7793, batch_reg_loss: 0.1948, reg_loss: 0.1944 ||:  75%|#######4  | 71/95 [00:48<00:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8932, UAS: 0.9439, LAS: 0.8939, UEM: 0.5835, LEM: 0.3387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5846, partial_loss/deprel_loss: 0.6107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8003, loss: 0.7786, batch_reg_loss: 0.1948, reg_loss: 0.1944 ||:  79%|#######8  | 75/95 [00:51<00:13,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8163, UAS: 0.9432, LAS: 0.8934, UEM: 0.5854, LEM: 0.3423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7572, partial_loss/deprel_loss: 1.0228, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3645, loss: 0.7825, batch_reg_loss: 0.1949, reg_loss: 0.1944 ||:  82%|########2 | 78/95 [00:53<00:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8684, UAS: 0.9431, LAS: 0.8933, UEM: 0.5838, LEM: 0.3411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9157, partial_loss/deprel_loss: 0.7864, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0072, loss: 0.7831, batch_reg_loss: 0.1949, reg_loss: 0.1945 ||:  85%|########5 | 81/95 [00:55<00:09,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9414, LAS: 0.8913, UEM: 0.5762, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8134, partial_loss/deprel_loss: 0.7467, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9549, loss: 0.7976, batch_reg_loss: 0.1949, reg_loss: 0.1945 ||:  88%|########8 | 84/95 [00:57<00:07,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7966, UAS: 0.9408, LAS: 0.8907, UEM: 0.5804, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0394, partial_loss/deprel_loss: 1.1325, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5089, loss: 0.8013, batch_reg_loss: 0.1950, reg_loss: 0.1945 ||:  92%|#########1| 87/95 [00:59<00:05,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9410, LAS: 0.8907, UEM: 0.5769, LEM: 0.3337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3560, partial_loss/deprel_loss: 0.5438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7013, loss: 0.8017, batch_reg_loss: 0.1950, reg_loss: 0.1945 ||:  96%|#########5| 91/95 [01:02<00:02,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9410, LAS: 0.8908, UEM: 0.5845, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3546, partial_loss/deprel_loss: 0.4884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6568, loss: 0.8013, batch_reg_loss: 0.1951, reg_loss: 0.1945 ||: 100%|##########| 95/95 [01:05<00:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9410, LAS: 0.8908, UEM: 0.5845, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3546, partial_loss/deprel_loss: 0.4884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6568, loss: 0.8013, batch_reg_loss: 0.1951, reg_loss: 0.1945 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n",
+      "2023-04-07 00:25:47,060 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9228, LAS: 0.8633, UEM: 0.3296, LEM: 0.0726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8452, partial_loss/deprel_loss: 32.7309, partial_loss/cycle_loss: 0.0000, batch_loss: 26.3538, loss: 34.2431, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.03s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9381, LAS: 0.8814, UEM: 0.5156, LEM: 0.2156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3101, partial_loss/deprel_loss: 26.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 21.1049, loss: 27.7967, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  55%|#####4    | 6/11 [00:04<00:04,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9497, LAS: 0.8967, UEM: 0.6925, LEM: 0.4118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1871, partial_loss/deprel_loss: 21.0855, partial_loss/cycle_loss: 0.0000, batch_loss: 16.9058, loss: 23.2656, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:07<00:00,  1.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9474, LAS: 0.8946, UEM: 0.6749, LEM: 0.3976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1030, partial_loss/deprel_loss: 45.7873, partial_loss/cycle_loss: 0.0000, batch_loss: 36.8505, loss: 24.5006, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00,  1.41it/s]\n",
+      "2023-04-07 00:25:54,870 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:25:54,870 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:25:54,870 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.195  |     0.000\n",
+      "2023-04-07 00:25:54,870 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - UEM                      |     0.585  |     0.675\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - LEM                      |     0.344  |     0.398\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - EM                       |     0.916  |     0.874\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.355  |     1.103\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |     0.947\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.488  |    45.787\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - loss                     |     0.801  |    24.501\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - LAS                      |     0.891  |     0.895\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:25:54,871 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:25:54,872 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:25:54,872 - INFO - combo.training.trainer - Epoch duration: 0:01:12.848706\n",
+      "2023-04-07 00:25:54,872 - INFO - combo.training.trainer - Estimated training time remaining: 5:51:38\n",
+      "2023-04-07 00:25:54,872 - INFO - allennlp.training.trainer - Epoch 86/399\n",
+      "2023-04-07 00:25:54,873 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:25:54,873 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:25:54,880 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9303, LAS: 0.8790, UEM: 0.5903, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2182, partial_loss/deprel_loss: 0.4540, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6020, loss: 0.8753, batch_reg_loss: 0.1952, reg_loss: 0.1951 ||:   5%|5         | 5/95 [00:02<00:40,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9434, LAS: 0.8926, UEM: 0.6223, LEM: 0.3405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2440, partial_loss/deprel_loss: 0.4128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5743, loss: 0.7749, batch_reg_loss: 0.1952, reg_loss: 0.1952 ||:   9%|9         | 9/95 [00:04<00:40,  2.10it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9415, LAS: 0.8907, UEM: 0.6017, LEM: 0.3346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9514, partial_loss/deprel_loss: 0.7318, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9710, loss: 0.7896, batch_reg_loss: 0.1953, reg_loss: 0.1952 ||:  13%|#2        | 12/95 [00:06<00:45,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9411, LAS: 0.8912, UEM: 0.5743, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3750, partial_loss/deprel_loss: 0.4740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6495, loss: 0.7949, batch_reg_loss: 0.1953, reg_loss: 0.1952 ||:  17%|#6        | 16/95 [00:09<00:46,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9423, LAS: 0.8922, UEM: 0.5722, LEM: 0.3120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4842, partial_loss/deprel_loss: 0.5115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7014, loss: 0.7872, batch_reg_loss: 0.1953, reg_loss: 0.1952 ||:  20%|##        | 19/95 [00:11<00:47,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9438, LAS: 0.8937, UEM: 0.5861, LEM: 0.3237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3016, partial_loss/deprel_loss: 0.4416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6089, loss: 0.7726, batch_reg_loss: 0.1954, reg_loss: 0.1952 ||:  23%|##3       | 22/95 [00:14<00:52,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8921, UAS: 0.9440, LAS: 0.8947, UEM: 0.5654, LEM: 0.3043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6113, partial_loss/deprel_loss: 0.6593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8451, loss: 0.7651, batch_reg_loss: 0.1954, reg_loss: 0.1953 ||:  27%|##7       | 26/95 [00:16<00:47,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9401, LAS: 0.8902, UEM: 0.5559, LEM: 0.2979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3724, partial_loss/deprel_loss: 0.9640, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2411, loss: 0.8040, batch_reg_loss: 0.1954, reg_loss: 0.1953 ||:  31%|###       | 29/95 [00:18<00:45,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9427, LAS: 0.8938, UEM: 0.6186, LEM: 0.3789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4439, partial_loss/deprel_loss: 0.4964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6814, loss: 0.7770, batch_reg_loss: 0.1955, reg_loss: 0.1953 ||:  34%|###3      | 32/95 [00:21<00:48,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9427, LAS: 0.8938, UEM: 0.6178, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2642, partial_loss/deprel_loss: 0.4197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5841, loss: 0.7726, batch_reg_loss: 0.1955, reg_loss: 0.1953 ||:  37%|###6      | 35/95 [00:23<00:44,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8743, UAS: 0.9427, LAS: 0.8938, UEM: 0.6098, LEM: 0.3661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7651, partial_loss/deprel_loss: 0.7290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9318, loss: 0.7718, batch_reg_loss: 0.1955, reg_loss: 0.1953 ||:  40%|####      | 38/95 [00:25<00:41,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8767, UAS: 0.9435, LAS: 0.8944, UEM: 0.6106, LEM: 0.3641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7390, partial_loss/deprel_loss: 0.7182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9179, loss: 0.7679, batch_reg_loss: 0.1956, reg_loss: 0.1954 ||:  43%|####3     | 41/95 [00:28<00:39,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9429, LAS: 0.8935, UEM: 0.5934, LEM: 0.3483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7213, partial_loss/deprel_loss: 0.7034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9026, loss: 0.7772, batch_reg_loss: 0.1956, reg_loss: 0.1954 ||:  47%|####7     | 45/95 [00:30<00:35,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9216, UAS: 0.9438, LAS: 0.8945, UEM: 0.5972, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2743, partial_loss/deprel_loss: 0.4010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5714, loss: 0.7687, batch_reg_loss: 0.1957, reg_loss: 0.1954 ||:  51%|#####     | 48/95 [00:32<00:33,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9421, LAS: 0.8928, UEM: 0.5813, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5677, partial_loss/deprel_loss: 0.6120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7988, loss: 0.7809, batch_reg_loss: 0.1957, reg_loss: 0.1954 ||:  55%|#####4    | 52/95 [00:35<00:29,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8515, UAS: 0.9420, LAS: 0.8925, UEM: 0.5764, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9556, partial_loss/deprel_loss: 0.8274, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0488, loss: 0.7859, batch_reg_loss: 0.1958, reg_loss: 0.1954 ||:  59%|#####8    | 56/95 [00:37<00:26,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9419, LAS: 0.8923, UEM: 0.5689, LEM: 0.3253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6214, partial_loss/deprel_loss: 0.6430, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8345, loss: 0.7897, batch_reg_loss: 0.1958, reg_loss: 0.1955 ||:  63%|######3   | 60/95 [00:40<00:23,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9411, LAS: 0.8915, UEM: 0.5695, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1562, partial_loss/deprel_loss: 0.3311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4920, loss: 0.7975, batch_reg_loss: 0.1959, reg_loss: 0.1955 ||:  66%|######6   | 63/95 [00:42<00:21,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9412, LAS: 0.8916, UEM: 0.5788, LEM: 0.3418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1075, partial_loss/deprel_loss: 0.2779, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4397, loss: 0.7970, batch_reg_loss: 0.1959, reg_loss: 0.1955 ||:  69%|######9   | 66/95 [00:44<00:20,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9420, LAS: 0.8924, UEM: 0.5859, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2186, partial_loss/deprel_loss: 0.4007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.7910, batch_reg_loss: 0.1960, reg_loss: 0.1955 ||:  74%|#######3  | 70/95 [00:47<00:17,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9424, LAS: 0.8926, UEM: 0.5855, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6856, partial_loss/deprel_loss: 0.6499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8531, loss: 0.7894, batch_reg_loss: 0.1960, reg_loss: 0.1955 ||:  77%|#######6  | 73/95 [00:49<00:15,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9419, LAS: 0.8921, UEM: 0.5873, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1316, partial_loss/deprel_loss: 0.3316, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4876, loss: 0.7939, batch_reg_loss: 0.1960, reg_loss: 0.1956 ||:  80%|########  | 76/95 [00:51<00:13,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.9419, LAS: 0.8920, UEM: 0.5851, LEM: 0.3440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0526, partial_loss/deprel_loss: 0.9078, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1329, loss: 0.7961, batch_reg_loss: 0.1961, reg_loss: 0.1956 ||:  84%|########4 | 80/95 [00:54<00:10,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9415, LAS: 0.8915, UEM: 0.5799, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8618, partial_loss/deprel_loss: 0.7938, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0035, loss: 0.8000, batch_reg_loss: 0.1961, reg_loss: 0.1956 ||:  87%|########7 | 83/95 [00:56<00:08,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9413, LAS: 0.8911, UEM: 0.5741, LEM: 0.3337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8762, partial_loss/deprel_loss: 0.7787, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9944, loss: 0.8044, batch_reg_loss: 0.1962, reg_loss: 0.1956 ||:  92%|#########1| 87/95 [00:58<00:05,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9415, LAS: 0.8913, UEM: 0.5878, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4850, partial_loss/deprel_loss: 0.5832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7597, loss: 0.8039, batch_reg_loss: 0.1962, reg_loss: 0.1957 ||:  96%|#########5| 91/95 [01:02<00:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9417, LAS: 0.8914, UEM: 0.5839, LEM: 0.3443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4754, partial_loss/deprel_loss: 0.5637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7423, loss: 0.8023, batch_reg_loss: 0.1963, reg_loss: 0.1957 ||: 100%|##########| 95/95 [01:04<00:00,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9417, LAS: 0.8914, UEM: 0.5839, LEM: 0.3443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4754, partial_loss/deprel_loss: 0.5637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7423, loss: 0.8023, batch_reg_loss: 0.1963, reg_loss: 0.1957 ||: 100%|##########| 95/95 [01:04<00:00,  1.47it/s]\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.196  |       N/A\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - UEM                      |     0.584  |       N/A\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - LEM                      |     0.344  |       N/A\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - EM                       |     0.893  |       N/A\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.475  |       N/A\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:26:59,579 - INFO - combo.training.tensorboard_writer - UAS                      |     0.942  |       N/A\n",
+      "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.564  |       N/A\n",
+      "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - loss                     |     0.802  |       N/A\n",
+      "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - LAS                      |     0.891  |       N/A\n",
+      "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:26:59,580 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:26:59,581 - INFO - combo.training.trainer - Epoch duration: 0:01:04.708363\n",
+      "2023-04-07 00:26:59,581 - INFO - combo.training.trainer - Estimated training time remaining: 5:50:22\n",
+      "2023-04-07 00:26:59,581 - INFO - allennlp.training.trainer - Epoch 87/399\n",
+      "2023-04-07 00:26:59,581 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:26:59,581 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:26:59,588 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9615, LAS: 0.9135, UEM: 0.6192, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3482, partial_loss/deprel_loss: 0.4458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6226, loss: 0.6525, batch_reg_loss: 0.1963, reg_loss: 0.1963 ||:   4%|4         | 4/95 [00:02<00:49,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9525, LAS: 0.9039, UEM: 0.5553, LEM: 0.2723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3492, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6272, loss: 0.7114, batch_reg_loss: 0.1963, reg_loss: 0.1963 ||:   7%|7         | 7/95 [00:04<00:53,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8363, UAS: 0.9434, LAS: 0.8928, UEM: 0.5168, LEM: 0.2456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3595, partial_loss/deprel_loss: 0.9489, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2274, loss: 0.7922, batch_reg_loss: 0.1964, reg_loss: 0.1963 ||:  11%|#         | 10/95 [00:06<00:53,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9357, LAS: 0.8853, UEM: 0.5261, LEM: 0.2734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1825, partial_loss/deprel_loss: 0.3490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5121, loss: 0.8409, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||:  15%|#4        | 14/95 [00:09<00:51,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9392, LAS: 0.8890, UEM: 0.5406, LEM: 0.2792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.4373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.8206, batch_reg_loss: 0.1965, reg_loss: 0.1964 ||:  19%|#8        | 18/95 [00:11<00:49,  1.55it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8982, UAS: 0.9399, LAS: 0.8901, UEM: 0.5422, LEM: 0.2855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4526, partial_loss/deprel_loss: 0.5380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7175, loss: 0.8118, batch_reg_loss: 0.1965, reg_loss: 0.1964 ||:  22%|##2       | 21/95 [00:13<00:48,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9409, LAS: 0.8908, UEM: 0.5386, LEM: 0.2820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2947, partial_loss/deprel_loss: 0.4101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5836, loss: 0.8113, batch_reg_loss: 0.1966, reg_loss: 0.1964 ||:  26%|##6       | 25/95 [00:16<00:44,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8926, UAS: 0.9423, LAS: 0.8922, UEM: 0.5240, LEM: 0.2676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5496, partial_loss/deprel_loss: 0.6464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8237, loss: 0.8047, batch_reg_loss: 0.1966, reg_loss: 0.1965 ||:  32%|###1      | 30/95 [00:18<00:37,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9406, LAS: 0.8905, UEM: 0.5147, LEM: 0.2611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5974, partial_loss/deprel_loss: 0.6037, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7992, loss: 0.8168, batch_reg_loss: 0.1967, reg_loss: 0.1965 ||:  37%|###6      | 35/95 [00:20<00:32,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9417, LAS: 0.8920, UEM: 0.5224, LEM: 0.2722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3679, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6711, loss: 0.8073, batch_reg_loss: 0.1968, reg_loss: 0.1965 ||:  42%|####2     | 40/95 [00:23<00:28,  1.90it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9440, LAS: 0.8946, UEM: 0.5725, LEM: 0.3269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1316, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4801, loss: 0.7860, batch_reg_loss: 0.1968, reg_loss: 0.1965 ||:  46%|####6     | 44/95 [00:25<00:26,  1.89it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9447, LAS: 0.8956, UEM: 0.5881, LEM: 0.3401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2774, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5514, loss: 0.7778, batch_reg_loss: 0.1969, reg_loss: 0.1966 ||:  51%|#####     | 48/95 [00:28<00:28,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9442, LAS: 0.8951, UEM: 0.5793, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1747, partial_loss/deprel_loss: 0.3913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5449, loss: 0.7808, batch_reg_loss: 0.1969, reg_loss: 0.1966 ||:  55%|#####4    | 52/95 [00:31<00:26,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8194, UAS: 0.9433, LAS: 0.8942, UEM: 0.5829, LEM: 0.3378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6835, partial_loss/deprel_loss: 1.0484, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3723, loss: 0.7876, batch_reg_loss: 0.1969, reg_loss: 0.1966 ||:  59%|#####8    | 56/95 [00:34<00:26,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9443, LAS: 0.8949, UEM: 0.5903, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2637, partial_loss/deprel_loss: 0.4897, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6414, loss: 0.7808, batch_reg_loss: 0.1970, reg_loss: 0.1966 ||:  63%|######3   | 60/95 [00:37<00:25,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9443, LAS: 0.8949, UEM: 0.5840, LEM: 0.3326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3851, partial_loss/deprel_loss: 0.5246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6937, loss: 0.7806, batch_reg_loss: 0.1970, reg_loss: 0.1967 ||:  67%|######7   | 64/95 [00:40<00:22,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9443, LAS: 0.8950, UEM: 0.5846, LEM: 0.3332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4486, partial_loss/deprel_loss: 0.4704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6631, loss: 0.7800, batch_reg_loss: 0.1971, reg_loss: 0.1967 ||:  72%|#######1  | 68/95 [00:42<00:18,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9439, LAS: 0.8946, UEM: 0.5818, LEM: 0.3319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0211, partial_loss/deprel_loss: 0.8719, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0988, loss: 0.7833, batch_reg_loss: 0.1971, reg_loss: 0.1967 ||:  75%|#######4  | 71/95 [00:45<00:16,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8461, UAS: 0.9427, LAS: 0.8933, UEM: 0.5758, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2804, partial_loss/deprel_loss: 0.8496, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1329, loss: 0.7921, batch_reg_loss: 0.1972, reg_loss: 0.1967 ||:  79%|#######8  | 75/95 [00:47<00:13,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8436, UAS: 0.9426, LAS: 0.8932, UEM: 0.5802, LEM: 0.3319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3690, partial_loss/deprel_loss: 0.8747, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1707, loss: 0.7923, batch_reg_loss: 0.1972, reg_loss: 0.1967 ||:  82%|########2 | 78/95 [00:49<00:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9424, LAS: 0.8930, UEM: 0.5744, LEM: 0.3273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6648, partial_loss/deprel_loss: 0.6441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8455, loss: 0.7947, batch_reg_loss: 0.1972, reg_loss: 0.1968 ||:  85%|########5 | 81/95 [00:51<00:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9427, LAS: 0.8933, UEM: 0.5824, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3121, partial_loss/deprel_loss: 0.4870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6493, loss: 0.7919, batch_reg_loss: 0.1973, reg_loss: 0.1968 ||:  88%|########8 | 84/95 [00:54<00:08,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9424, LAS: 0.8929, UEM: 0.5754, LEM: 0.3304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8627, partial_loss/deprel_loss: 0.8393, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0413, loss: 0.7959, batch_reg_loss: 0.1973, reg_loss: 0.1968 ||:  92%|#########1| 87/95 [00:56<00:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9418, LAS: 0.8922, UEM: 0.5728, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8800, partial_loss/deprel_loss: 0.7644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9849, loss: 0.8008, batch_reg_loss: 0.1974, reg_loss: 0.1968 ||:  96%|#########5| 91/95 [00:58<00:02,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9425, LAS: 0.8930, UEM: 0.5869, LEM: 0.3465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0619, partial_loss/deprel_loss: 0.1758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3505, loss: 0.7957, batch_reg_loss: 0.1974, reg_loss: 0.1968 ||: 100%|##########| 95/95 [01:01<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9425, LAS: 0.8930, UEM: 0.5869, LEM: 0.3465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0619, partial_loss/deprel_loss: 0.1758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3505, loss: 0.7957, batch_reg_loss: 0.1974, reg_loss: 0.1968 ||: 100%|##########| 95/95 [01:01<00:00,  1.54it/s]\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.197  |       N/A\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - UEM                      |     0.587  |       N/A\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - LEM                      |     0.347  |       N/A\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - EM                       |     0.951  |       N/A\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.062  |       N/A\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:28:01,203 - INFO - combo.training.tensorboard_writer - UAS                      |     0.943  |       N/A\n",
+      "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.176  |       N/A\n",
+      "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - loss                     |     0.796  |       N/A\n",
+      "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - LAS                      |     0.893  |       N/A\n",
+      "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:28:01,204 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:28:01,205 - INFO - combo.training.trainer - Epoch duration: 0:01:01.623636\n",
+      "2023-04-07 00:28:01,205 - INFO - combo.training.trainer - Estimated training time remaining: 5:48:55\n",
+      "2023-04-07 00:28:01,205 - INFO - allennlp.training.trainer - Epoch 88/399\n",
+      "2023-04-07 00:28:01,205 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:28:01,205 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:28:01,211 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9353, LAS: 0.8842, UEM: 0.4656, LEM: 0.2133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9636, partial_loss/deprel_loss: 0.8324, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0561, loss: 0.8300, batch_reg_loss: 0.1975, reg_loss: 0.1975 ||:   3%|3         | 3/95 [00:02<01:09,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8447, UAS: 0.9345, LAS: 0.8837, UEM: 0.4115, LEM: 0.1826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3071, partial_loss/deprel_loss: 0.8828, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1652, loss: 0.8505, batch_reg_loss: 0.1975, reg_loss: 0.1975 ||:   7%|7         | 7/95 [00:04<01:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9450, LAS: 0.8953, UEM: 0.5579, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3981, partial_loss/deprel_loss: 0.4900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6692, loss: 0.7676, batch_reg_loss: 0.1976, reg_loss: 0.1975 ||:  11%|#         | 10/95 [00:06<01:01,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9481, LAS: 0.8994, UEM: 0.5789, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3607, partial_loss/deprel_loss: 0.4957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.7347, batch_reg_loss: 0.1976, reg_loss: 0.1975 ||:  14%|#3        | 13/95 [00:09<00:58,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9512, LAS: 0.9047, UEM: 0.6611, LEM: 0.4402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6081, partial_loss/deprel_loss: 0.7000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8793, loss: 0.7090, batch_reg_loss: 0.1976, reg_loss: 0.1975 ||:  17%|#6        | 16/95 [00:11<01:00,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9520, LAS: 0.9051, UEM: 0.6520, LEM: 0.4225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3609, partial_loss/deprel_loss: 0.4233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6084, loss: 0.7045, batch_reg_loss: 0.1976, reg_loss: 0.1976 ||:  20%|##        | 19/95 [00:13<00:58,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9511, LAS: 0.9039, UEM: 0.6374, LEM: 0.4072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2298, partial_loss/deprel_loss: 0.3898, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5555, loss: 0.7115, batch_reg_loss: 0.1977, reg_loss: 0.1976 ||:  24%|##4       | 23/95 [00:16<00:54,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8630, UAS: 0.9472, LAS: 0.8994, UEM: 0.6104, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0077, partial_loss/deprel_loss: 0.8336, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0661, loss: 0.7468, batch_reg_loss: 0.1977, reg_loss: 0.1976 ||:  28%|##8       | 27/95 [00:19<00:49,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9473, LAS: 0.8991, UEM: 0.6025, LEM: 0.3750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7115, partial_loss/deprel_loss: 0.6357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8486, loss: 0.7498, batch_reg_loss: 0.1977, reg_loss: 0.1976 ||:  33%|###2      | 31/95 [00:22<00:44,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7966, UAS: 0.9438, LAS: 0.8954, UEM: 0.5855, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9936, partial_loss/deprel_loss: 0.9843, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3839, loss: 0.7738, batch_reg_loss: 0.1977, reg_loss: 0.1976 ||:  36%|###5      | 34/95 [00:24<00:43,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9240, UAS: 0.9449, LAS: 0.8968, UEM: 0.5936, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2525, partial_loss/deprel_loss: 0.3521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5299, loss: 0.7618, batch_reg_loss: 0.1978, reg_loss: 0.1976 ||:  39%|###8      | 37/95 [00:26<00:42,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8425, UAS: 0.9435, LAS: 0.8951, UEM: 0.5877, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2622, partial_loss/deprel_loss: 0.9161, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1831, loss: 0.7751, batch_reg_loss: 0.1978, reg_loss: 0.1976 ||:  42%|####2     | 40/95 [00:28<00:40,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9431, LAS: 0.8944, UEM: 0.5807, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4448, partial_loss/deprel_loss: 0.6319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7923, loss: 0.7778, batch_reg_loss: 0.1978, reg_loss: 0.1977 ||:  45%|####5     | 43/95 [00:31<00:39,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8784, UAS: 0.9427, LAS: 0.8940, UEM: 0.5724, LEM: 0.3383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7533, partial_loss/deprel_loss: 0.6934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9033, loss: 0.7822, batch_reg_loss: 0.1979, reg_loss: 0.1977 ||:  49%|####9     | 47/95 [00:33<00:34,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9435, LAS: 0.8949, UEM: 0.5817, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2394, partial_loss/deprel_loss: 0.3445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5214, loss: 0.7740, batch_reg_loss: 0.1979, reg_loss: 0.1977 ||:  53%|#####2    | 50/95 [00:36<00:33,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8197, UAS: 0.9415, LAS: 0.8927, UEM: 0.5700, LEM: 0.3374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4372, partial_loss/deprel_loss: 1.0914, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3585, loss: 0.7914, batch_reg_loss: 0.1980, reg_loss: 0.1977 ||:  56%|#####5    | 53/95 [00:38<00:30,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9413, LAS: 0.8922, UEM: 0.5691, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2474, partial_loss/deprel_loss: 0.4322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5933, loss: 0.7934, batch_reg_loss: 0.1980, reg_loss: 0.1977 ||:  59%|#####8    | 56/95 [00:40<00:28,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9411, LAS: 0.8918, UEM: 0.5593, LEM: 0.3255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8201, partial_loss/deprel_loss: 0.6674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8960, loss: 0.7948, batch_reg_loss: 0.1981, reg_loss: 0.1977 ||:  64%|######4   | 61/95 [00:42<00:22,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9403, LAS: 0.8908, UEM: 0.5581, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1353, partial_loss/deprel_loss: 0.3320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4908, loss: 0.8029, batch_reg_loss: 0.1981, reg_loss: 0.1978 ||:  69%|######9   | 66/95 [00:45<00:17,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8370, UAS: 0.9406, LAS: 0.8907, UEM: 0.5623, LEM: 0.3296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0894, partial_loss/deprel_loss: 0.9622, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1858, loss: 0.8026, batch_reg_loss: 0.1982, reg_loss: 0.1978 ||:  75%|#######4  | 71/95 [00:47<00:13,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9408, LAS: 0.8909, UEM: 0.5787, LEM: 0.3477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1041, partial_loss/deprel_loss: 0.2437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4141, loss: 0.8013, batch_reg_loss: 0.1983, reg_loss: 0.1978 ||:  80%|########  | 76/95 [00:50<00:10,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9404, LAS: 0.8905, UEM: 0.5721, LEM: 0.3411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6706, partial_loss/deprel_loss: 0.6264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8336, loss: 0.8033, batch_reg_loss: 0.1983, reg_loss: 0.1979 ||:  84%|########4 | 80/95 [00:52<00:08,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9411, LAS: 0.8912, UEM: 0.5771, LEM: 0.3429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3645, partial_loss/deprel_loss: 0.5852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7394, loss: 0.7981, batch_reg_loss: 0.1984, reg_loss: 0.1979 ||:  88%|########8 | 84/95 [00:55<00:06,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9412, LAS: 0.8912, UEM: 0.5732, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4024, partial_loss/deprel_loss: 0.5715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7361, loss: 0.8009, batch_reg_loss: 0.1984, reg_loss: 0.1979 ||:  93%|#########2| 88/95 [00:58<00:04,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9422, LAS: 0.8921, UEM: 0.5884, LEM: 0.3509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1376, partial_loss/deprel_loss: 0.3224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4839, loss: 0.7930, batch_reg_loss: 0.1984, reg_loss: 0.1979 ||:  97%|#########6| 92/95 [01:00<00:01,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9420, LAS: 0.8917, UEM: 0.5827, LEM: 0.3449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6680, partial_loss/deprel_loss: 0.7358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9207, loss: 0.7973, batch_reg_loss: 0.1985, reg_loss: 0.1979 ||: 100%|##########| 95/95 [01:02<00:00,  1.51it/s]\n",
+      "2023-04-07 00:29:04,015 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.198  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - UEM                      |     0.583  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - LEM                      |     0.345  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - EM                       |     0.884  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.668  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - UAS                      |     0.942  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.736  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - loss                     |     0.797  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - LAS                      |     0.892  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:29:04,016 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:29:04,017 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:29:04,017 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:29:04,017 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:29:04,017 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:29:04,017 - INFO - combo.training.trainer - Epoch duration: 0:01:02.812578\n",
+      "2023-04-07 00:29:04,018 - INFO - combo.training.trainer - Estimated training time remaining: 5:47:33\n",
+      "2023-04-07 00:29:04,018 - INFO - allennlp.training.trainer - Epoch 89/399\n",
+      "2023-04-07 00:29:04,018 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:29:04,018 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:29:04,025 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9481, LAS: 0.9035, UEM: 0.4851, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5204, partial_loss/deprel_loss: 0.5339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7297, loss: 0.7150, batch_reg_loss: 0.1985, reg_loss: 0.1985 ||:   3%|3         | 3/95 [00:02<01:01,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9456, LAS: 0.8989, UEM: 0.4396, LEM: 0.1978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4658, partial_loss/deprel_loss: 0.5637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7426, loss: 0.7531, batch_reg_loss: 0.1985, reg_loss: 0.1985 ||:   6%|6         | 6/95 [00:04<01:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9442, LAS: 0.8966, UEM: 0.4105, LEM: 0.1650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7382, partial_loss/deprel_loss: 0.7128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9165, loss: 0.7817, batch_reg_loss: 0.1986, reg_loss: 0.1985 ||:  11%|#         | 10/95 [00:06<00:57,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9434, LAS: 0.8962, UEM: 0.4338, LEM: 0.1837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5118, partial_loss/deprel_loss: 0.5192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7163, loss: 0.7785, batch_reg_loss: 0.1986, reg_loss: 0.1985 ||:  14%|#3        | 13/95 [00:08<00:56,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9447, LAS: 0.8973, UEM: 0.4778, LEM: 0.2194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2952, partial_loss/deprel_loss: 0.4379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6080, loss: 0.7694, batch_reg_loss: 0.1986, reg_loss: 0.1985 ||:  17%|#6        | 16/95 [00:11<00:56,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9442, LAS: 0.8967, UEM: 0.5127, LEM: 0.2585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4065, partial_loss/deprel_loss: 0.4926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6740, loss: 0.7751, batch_reg_loss: 0.1987, reg_loss: 0.1986 ||:  20%|##        | 19/95 [00:13<00:55,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9470, LAS: 0.8991, UEM: 0.5595, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2982, partial_loss/deprel_loss: 0.4643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6297, loss: 0.7508, batch_reg_loss: 0.1987, reg_loss: 0.1986 ||:  23%|##3       | 22/95 [00:16<00:55,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8875, UAS: 0.9477, LAS: 0.8998, UEM: 0.5598, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6401, partial_loss/deprel_loss: 0.6176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8208, loss: 0.7474, batch_reg_loss: 0.1987, reg_loss: 0.1986 ||:  26%|##6       | 25/95 [00:18<00:51,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9437, LAS: 0.8956, UEM: 0.5304, LEM: 0.2771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4528, partial_loss/deprel_loss: 0.5562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7343, loss: 0.7814, batch_reg_loss: 0.1988, reg_loss: 0.1986 ||:  31%|###       | 29/95 [00:20<00:46,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8773, UAS: 0.9447, LAS: 0.8961, UEM: 0.5438, LEM: 0.2865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6302, partial_loss/deprel_loss: 0.6282, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8274, loss: 0.7733, batch_reg_loss: 0.1988, reg_loss: 0.1986 ||:  34%|###3      | 32/95 [00:23<00:46,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9434, LAS: 0.8946, UEM: 0.5375, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5787, partial_loss/deprel_loss: 0.6191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8098, loss: 0.7841, batch_reg_loss: 0.1988, reg_loss: 0.1986 ||:  38%|###7      | 36/95 [00:25<00:42,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9428, LAS: 0.8936, UEM: 0.5350, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5987, partial_loss/deprel_loss: 0.7361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9075, loss: 0.7898, batch_reg_loss: 0.1989, reg_loss: 0.1987 ||:  42%|####2     | 40/95 [00:28<00:38,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9414, LAS: 0.8919, UEM: 0.5269, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9567, partial_loss/deprel_loss: 0.8349, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0581, loss: 0.8030, batch_reg_loss: 0.1989, reg_loss: 0.1987 ||:  46%|####6     | 44/95 [00:31<00:34,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9420, LAS: 0.8931, UEM: 0.5699, LEM: 0.3356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2347, partial_loss/deprel_loss: 0.3596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5336, loss: 0.7941, batch_reg_loss: 0.1990, reg_loss: 0.1987 ||:  49%|####9     | 47/95 [00:33<00:35,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8519, UAS: 0.9396, LAS: 0.8906, UEM: 0.5562, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0159, partial_loss/deprel_loss: 0.8514, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0833, loss: 0.8123, batch_reg_loss: 0.1990, reg_loss: 0.1987 ||:  53%|#####2    | 50/95 [00:35<00:32,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8634, UAS: 0.9394, LAS: 0.8902, UEM: 0.5621, LEM: 0.3331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9020, partial_loss/deprel_loss: 0.7869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0089, loss: 0.8138, batch_reg_loss: 0.1990, reg_loss: 0.1987 ||:  56%|#####5    | 53/95 [00:37<00:30,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9405, LAS: 0.8913, UEM: 0.5770, LEM: 0.3473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1214, partial_loss/deprel_loss: 0.2771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4450, loss: 0.8053, batch_reg_loss: 0.1991, reg_loss: 0.1988 ||:  59%|#####8    | 56/95 [00:40<00:29,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9407, LAS: 0.8914, UEM: 0.5740, LEM: 0.3429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2917, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6335, loss: 0.8043, batch_reg_loss: 0.1991, reg_loss: 0.1988 ||:  62%|######2   | 59/95 [00:42<00:26,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8363, UAS: 0.9388, LAS: 0.8892, UEM: 0.5662, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3096, partial_loss/deprel_loss: 0.8764, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1622, loss: 0.8187, batch_reg_loss: 0.1992, reg_loss: 0.1988 ||:  65%|######5   | 62/95 [00:44<00:23,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9393, LAS: 0.8896, UEM: 0.5640, LEM: 0.3341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2854, partial_loss/deprel_loss: 0.5068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6617, loss: 0.8159, batch_reg_loss: 0.1992, reg_loss: 0.1988 ||:  69%|######9   | 66/95 [00:46<00:19,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9396, LAS: 0.8899, UEM: 0.5684, LEM: 0.3402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2685, partial_loss/deprel_loss: 0.3919, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5665, loss: 0.8126, batch_reg_loss: 0.1993, reg_loss: 0.1988 ||:  74%|#######3  | 70/95 [00:49<00:16,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9406, LAS: 0.8911, UEM: 0.5816, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5669, partial_loss/deprel_loss: 0.6554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8370, loss: 0.8050, batch_reg_loss: 0.1993, reg_loss: 0.1989 ||:  78%|#######7  | 74/95 [00:52<00:14,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9397, LAS: 0.8902, UEM: 0.5767, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4900, partial_loss/deprel_loss: 0.5398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7292, loss: 0.8124, batch_reg_loss: 0.1994, reg_loss: 0.1989 ||:  81%|########1 | 77/95 [00:54<00:12,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9408, LAS: 0.8914, UEM: 0.5873, LEM: 0.3560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2311, partial_loss/deprel_loss: 0.4149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5775, loss: 0.8032, batch_reg_loss: 0.1994, reg_loss: 0.1989 ||:  84%|########4 | 80/95 [00:56<00:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9411, LAS: 0.8917, UEM: 0.5851, LEM: 0.3524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3257, partial_loss/deprel_loss: 0.4570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6301, loss: 0.8013, batch_reg_loss: 0.1994, reg_loss: 0.1989 ||:  87%|########7 | 83/95 [00:58<00:08,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9405, LAS: 0.8909, UEM: 0.5781, LEM: 0.3464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0019, partial_loss/deprel_loss: 0.7952, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0360, loss: 0.8081, batch_reg_loss: 0.1995, reg_loss: 0.1989 ||:  92%|#########1| 87/95 [01:01<00:05,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9401, LAS: 0.8905, UEM: 0.5735, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7059, partial_loss/deprel_loss: 0.6153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8329, loss: 0.8110, batch_reg_loss: 0.1995, reg_loss: 0.1990 ||:  95%|#########4| 90/95 [01:03<00:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9411, LAS: 0.8917, UEM: 0.5826, LEM: 0.3512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.8023, batch_reg_loss: 0.1996, reg_loss: 0.1990 ||: 100%|##########| 95/95 [01:05<00:00,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9411, LAS: 0.8917, UEM: 0.5826, LEM: 0.3512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.8023, batch_reg_loss: 0.1996, reg_loss: 0.1990 ||: 100%|##########| 95/95 [01:05<00:00,  1.45it/s]\n",
+      "2023-04-07 00:30:09,657 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:30:09,657 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 00:30:09,657 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.199  |       N/A\n",
+      "2023-04-07 00:30:09,657 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - UEM                      |     0.583  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - LEM                      |     0.351  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - EM                       |     0.914  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.242  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.421  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - loss                     |     0.802  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - LAS                      |     0.892  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:30:09,658 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:30:09,659 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:30:09,659 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:30:09,659 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:30:09,659 - INFO - combo.training.trainer - Epoch duration: 0:01:05.641583\n",
+      "2023-04-07 00:30:09,659 - INFO - combo.training.trainer - Estimated training time remaining: 5:46:21\n",
+      "2023-04-07 00:30:09,659 - INFO - allennlp.training.trainer - Epoch 90/399\n",
+      "2023-04-07 00:30:09,660 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:30:09,660 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:30:09,667 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9450, LAS: 0.8936, UEM: 0.5123, LEM: 0.2704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7253, partial_loss/deprel_loss: 0.6645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8763, loss: 0.7937, batch_reg_loss: 0.1996, reg_loss: 0.1996 ||:   5%|5         | 5/95 [00:02<00:42,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9180, UAS: 0.9427, LAS: 0.8942, UEM: 0.5429, LEM: 0.3019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4502, partial_loss/deprel_loss: 0.4530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6521, loss: 0.7870, batch_reg_loss: 0.1997, reg_loss: 0.1996 ||:  11%|#         | 10/95 [00:04<00:39,  2.14it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9460, LAS: 0.8988, UEM: 0.5889, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2637, partial_loss/deprel_loss: 0.3950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5685, loss: 0.7484, batch_reg_loss: 0.1997, reg_loss: 0.1997 ||:  15%|#4        | 14/95 [00:07<00:41,  1.96it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9508, LAS: 0.9035, UEM: 0.6386, LEM: 0.3827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2179, partial_loss/deprel_loss: 0.3739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5424, loss: 0.7130, batch_reg_loss: 0.1998, reg_loss: 0.1997 ||:  19%|#8        | 18/95 [00:09<00:43,  1.77it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9519, LAS: 0.9046, UEM: 0.6384, LEM: 0.3777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2246, partial_loss/deprel_loss: 0.3800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5487, loss: 0.7054, batch_reg_loss: 0.1998, reg_loss: 0.1997 ||:  22%|##2       | 21/95 [00:12<00:47,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9489, LAS: 0.9007, UEM: 0.6122, LEM: 0.3584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0449, partial_loss/deprel_loss: 0.8457, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0853, loss: 0.7370, batch_reg_loss: 0.1998, reg_loss: 0.1997 ||:  25%|##5       | 24/95 [00:14<00:46,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9482, LAS: 0.8997, UEM: 0.6132, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0205, partial_loss/deprel_loss: 0.8360, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0728, loss: 0.7427, batch_reg_loss: 0.1998, reg_loss: 0.1997 ||:  29%|##9       | 28/95 [00:16<00:43,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9476, LAS: 0.8990, UEM: 0.5980, LEM: 0.3459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3960, partial_loss/deprel_loss: 0.4589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6462, loss: 0.7487, batch_reg_loss: 0.1999, reg_loss: 0.1997 ||:  33%|###2      | 31/95 [00:18<00:42,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9457, LAS: 0.8969, UEM: 0.5970, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3393, partial_loss/deprel_loss: 0.5142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6791, loss: 0.7626, batch_reg_loss: 0.1999, reg_loss: 0.1998 ||:  36%|###5      | 34/95 [00:21<00:41,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9449, LAS: 0.8961, UEM: 0.5941, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2567, partial_loss/deprel_loss: 0.4196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5870, loss: 0.7677, batch_reg_loss: 0.1999, reg_loss: 0.1998 ||:  40%|####      | 38/95 [00:23<00:38,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9417, LAS: 0.8924, UEM: 0.5785, LEM: 0.3343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9151, partial_loss/deprel_loss: 0.7372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9727, loss: 0.7963, batch_reg_loss: 0.2000, reg_loss: 0.1998 ||:  43%|####3     | 41/95 [00:25<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9403, LAS: 0.8911, UEM: 0.5619, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1120, partial_loss/deprel_loss: 0.7932, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0570, loss: 0.8087, batch_reg_loss: 0.2000, reg_loss: 0.1998 ||:  47%|####7     | 45/95 [00:28<00:32,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9415, LAS: 0.8924, UEM: 0.5658, LEM: 0.3217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3023, partial_loss/deprel_loss: 0.5293, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6840, loss: 0.7983, batch_reg_loss: 0.2001, reg_loss: 0.1998 ||:  52%|#####1    | 49/95 [00:30<00:29,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9432, LAS: 0.8943, UEM: 0.5872, LEM: 0.3421, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1945, partial_loss/deprel_loss: 0.2997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4789, loss: 0.7849, batch_reg_loss: 0.2002, reg_loss: 0.1999 ||:  56%|#####5    | 53/95 [00:33<00:29,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8522, UAS: 0.9423, LAS: 0.8932, UEM: 0.5780, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2293, partial_loss/deprel_loss: 0.9079, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1724, loss: 0.7951, batch_reg_loss: 0.2002, reg_loss: 0.1999 ||:  60%|######    | 57/95 [00:36<00:25,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9628, UAS: 0.9417, LAS: 0.8928, UEM: 0.5927, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0499, partial_loss/deprel_loss: 0.1731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3488, loss: 0.7994, batch_reg_loss: 0.2003, reg_loss: 0.1999 ||:  64%|######4   | 61/95 [00:39<00:23,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9412, LAS: 0.8921, UEM: 0.5921, LEM: 0.3604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2756, partial_loss/deprel_loss: 0.4309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6002, loss: 0.8031, batch_reg_loss: 0.2003, reg_loss: 0.1999 ||:  67%|######7   | 64/95 [00:42<00:23,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9423, LAS: 0.8931, UEM: 0.6025, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3239, partial_loss/deprel_loss: 0.5025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6671, loss: 0.7938, batch_reg_loss: 0.2004, reg_loss: 0.1999 ||:  71%|#######   | 67/95 [00:44<00:21,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9422, LAS: 0.8929, UEM: 0.6057, LEM: 0.3713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5660, partial_loss/deprel_loss: 0.5883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7842, loss: 0.7939, batch_reg_loss: 0.2004, reg_loss: 0.2000 ||:  74%|#######3  | 70/95 [00:46<00:19,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9420, LAS: 0.8928, UEM: 0.6053, LEM: 0.3705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2561, partial_loss/deprel_loss: 0.4256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5922, loss: 0.7944, batch_reg_loss: 0.2004, reg_loss: 0.2000 ||:  77%|#######6  | 73/95 [00:48<00:16,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9422, LAS: 0.8928, UEM: 0.5995, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5083, partial_loss/deprel_loss: 0.7004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8625, loss: 0.7949, batch_reg_loss: 0.2005, reg_loss: 0.2000 ||:  80%|########  | 76/95 [00:50<00:13,  1.37it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9424, LAS: 0.8932, UEM: 0.6052, LEM: 0.3733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0929, partial_loss/deprel_loss: 0.2348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4069, loss: 0.7926, batch_reg_loss: 0.2005, reg_loss: 0.2000 ||:  83%|########3 | 79/95 [00:53<00:11,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.9423, LAS: 0.8931, UEM: 0.5989, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6515, partial_loss/deprel_loss: 0.8085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9777, loss: 0.7942, batch_reg_loss: 0.2006, reg_loss: 0.2000 ||:  87%|########7 | 83/95 [00:55<00:08,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9423, LAS: 0.8929, UEM: 0.5913, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8163, partial_loss/deprel_loss: 0.6959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9206, loss: 0.7933, batch_reg_loss: 0.2006, reg_loss: 0.2001 ||:  92%|#########1| 87/95 [00:58<00:05,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9423, LAS: 0.8929, UEM: 0.5877, LEM: 0.3532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2587, partial_loss/deprel_loss: 0.4601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6205, loss: 0.7947, batch_reg_loss: 0.2006, reg_loss: 0.2001 ||:  96%|#########5| 91/95 [01:00<00:02,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9417, LAS: 0.8922, UEM: 0.5804, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4732, partial_loss/deprel_loss: 0.5810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7602, loss: 0.8000, batch_reg_loss: 0.2007, reg_loss: 0.2001 ||: 100%|##########| 95/95 [01:03<00:00,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9417, LAS: 0.8922, UEM: 0.5804, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4732, partial_loss/deprel_loss: 0.5810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7602, loss: 0.8000, batch_reg_loss: 0.2007, reg_loss: 0.2001 ||: 100%|##########| 95/95 [01:03<00:00,  1.51it/s]\n",
+      "2023-04-07 00:31:12,789 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9410, LAS: 0.8857, UEM: 0.4621, LEM: 0.1514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8507, partial_loss/deprel_loss: 31.5549, partial_loss/cycle_loss: 0.0000, batch_loss: 25.4141, loss: 21.2894, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:07,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9450, LAS: 0.8936, UEM: 0.6514, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1134, partial_loss/deprel_loss: 43.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 35.0502, loss: 21.7831, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:05,  1.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9368, LAS: 0.8826, UEM: 0.5799, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5046, partial_loss/deprel_loss: 49.4599, partial_loss/cycle_loss: 0.0000, batch_loss: 39.8689, loss: 25.7462, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:07<00:04,  1.02s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9441, LAS: 0.8900, UEM: 0.6513, LEM: 0.3949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4922, partial_loss/deprel_loss: 26.0854, partial_loss/cycle_loss: 0.0000, batch_loss: 20.9668, loss: 24.0852, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  82%|########1 | 9/11 [00:09<00:02,  1.02s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9477, LAS: 0.8952, UEM: 0.6692, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3859, partial_loss/deprel_loss: 21.0911, partial_loss/cycle_loss: 0.0000, batch_loss: 16.9501, loss: 23.0576, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:11<00:00,  1.00s/it]\n",
+      "2023-04-07 00:31:23,825 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.200  |     0.000\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - UEM                      |     0.580  |     0.669\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - LEM                      |     0.347  |     0.406\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - EM                       |     0.897  |     0.918\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.473  |     0.386\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - UAS                      |     0.942  |     0.948\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.581  |    21.091\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - loss                     |     0.800  |    23.058\n",
+      "2023-04-07 00:31:23,826 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - LAS                      |     0.892  |     0.895\n",
+      "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:31:23,827 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:31:23,828 - INFO - combo.training.trainer - Epoch duration: 0:01:14.168224\n",
+      "2023-04-07 00:31:23,828 - INFO - combo.training.trainer - Estimated training time remaining: 5:45:39\n",
+      "2023-04-07 00:31:23,828 - INFO - allennlp.training.trainer - Epoch 91/399\n",
+      "2023-04-07 00:31:23,828 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:31:23,828 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:31:23,836 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8423, UAS: 0.9371, LAS: 0.8873, UEM: 0.5567, LEM: 0.3038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2762, partial_loss/deprel_loss: 0.9301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2001, loss: 0.8243, batch_reg_loss: 0.2007, reg_loss: 0.2007 ||:   4%|4         | 4/95 [00:02<00:57,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9257, LAS: 0.8748, UEM: 0.4554, LEM: 0.2406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5300, partial_loss/deprel_loss: 0.5716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7641, loss: 0.9286, batch_reg_loss: 0.2008, reg_loss: 0.2007 ||:   7%|7         | 7/95 [00:04<00:56,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9312, LAS: 0.8795, UEM: 0.4493, LEM: 0.2157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4770, partial_loss/deprel_loss: 0.5947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7720, loss: 0.9050, batch_reg_loss: 0.2008, reg_loss: 0.2008 ||:  12%|#1        | 11/95 [00:07<00:53,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8584, UAS: 0.9337, LAS: 0.8820, UEM: 0.4745, LEM: 0.2472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9149, partial_loss/deprel_loss: 0.8923, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0978, loss: 0.8786, batch_reg_loss: 0.2009, reg_loss: 0.2008 ||:  17%|#6        | 16/95 [00:09<00:46,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9357, LAS: 0.8855, UEM: 0.5141, LEM: 0.2935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1272, partial_loss/deprel_loss: 0.2702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4426, loss: 0.8593, batch_reg_loss: 0.2010, reg_loss: 0.2008 ||:  22%|##2       | 21/95 [00:11<00:41,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9367, LAS: 0.8866, UEM: 0.5174, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0210, partial_loss/deprel_loss: 0.8528, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0875, loss: 0.8502, batch_reg_loss: 0.2011, reg_loss: 0.2009 ||:  26%|##6       | 25/95 [00:14<00:42,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9350, LAS: 0.8844, UEM: 0.4910, LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9201, partial_loss/deprel_loss: 0.8418, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0586, loss: 0.8664, batch_reg_loss: 0.2011, reg_loss: 0.2009 ||:  31%|###       | 29/95 [00:16<00:39,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9362, LAS: 0.8850, UEM: 0.5022, LEM: 0.2761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5716, partial_loss/deprel_loss: 0.6732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8541, loss: 0.8630, batch_reg_loss: 0.2012, reg_loss: 0.2009 ||:  35%|###4      | 33/95 [00:19<00:36,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9373, LAS: 0.8861, UEM: 0.4997, LEM: 0.2710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7257, partial_loss/deprel_loss: 0.5830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8128, loss: 0.8521, batch_reg_loss: 0.2012, reg_loss: 0.2010 ||:  39%|###8      | 37/95 [00:21<00:34,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8843, UAS: 0.9377, LAS: 0.8863, UEM: 0.5018, LEM: 0.2710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5346, partial_loss/deprel_loss: 0.6944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8637, loss: 0.8491, batch_reg_loss: 0.2013, reg_loss: 0.2010 ||:  43%|####3     | 41/95 [00:23<00:30,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9386, LAS: 0.8873, UEM: 0.5077, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3799, partial_loss/deprel_loss: 0.5438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7123, loss: 0.8409, batch_reg_loss: 0.2013, reg_loss: 0.2010 ||:  47%|####7     | 45/95 [00:25<00:27,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8428, UAS: 0.9375, LAS: 0.8861, UEM: 0.5085, LEM: 0.2744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3011, partial_loss/deprel_loss: 0.9288, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2046, loss: 0.8502, batch_reg_loss: 0.2014, reg_loss: 0.2010 ||:  52%|#####1    | 49/95 [00:27<00:24,  1.86it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8920, UAS: 0.9384, LAS: 0.8875, UEM: 0.5119, LEM: 0.2741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5170, partial_loss/deprel_loss: 0.6469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8223, loss: 0.8384, batch_reg_loss: 0.2014, reg_loss: 0.2011 ||:  56%|#####5    | 53/95 [00:30<00:24,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9405, LAS: 0.8896, UEM: 0.5428, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1974, partial_loss/deprel_loss: 0.4242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5803, loss: 0.8211, batch_reg_loss: 0.2015, reg_loss: 0.2011 ||:  60%|######    | 57/95 [00:33<00:22,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9399, LAS: 0.8888, UEM: 0.5363, LEM: 0.2924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2275, partial_loss/deprel_loss: 0.4788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6300, loss: 0.8269, batch_reg_loss: 0.2015, reg_loss: 0.2011 ||:  64%|######4   | 61/95 [00:36<00:22,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9406, LAS: 0.8896, UEM: 0.5465, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3062, partial_loss/deprel_loss: 0.5368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6922, loss: 0.8216, batch_reg_loss: 0.2015, reg_loss: 0.2011 ||:  68%|######8   | 65/95 [00:39<00:19,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9390, LAS: 0.8876, UEM: 0.5362, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4192, partial_loss/deprel_loss: 0.5808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7500, loss: 0.8364, batch_reg_loss: 0.2016, reg_loss: 0.2012 ||:  73%|#######2  | 69/95 [00:41<00:17,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9397, LAS: 0.8884, UEM: 0.5377, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4453, partial_loss/deprel_loss: 0.5649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7426, loss: 0.8307, batch_reg_loss: 0.2016, reg_loss: 0.2012 ||:  77%|#######6  | 73/95 [00:44<00:14,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9408, LAS: 0.8897, UEM: 0.5490, LEM: 0.2981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2844, partial_loss/deprel_loss: 0.5402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6907, loss: 0.8207, batch_reg_loss: 0.2017, reg_loss: 0.2012 ||:  81%|########1 | 77/95 [00:46<00:11,  1.60it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.9404, LAS: 0.8891, UEM: 0.5405, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9738, partial_loss/deprel_loss: 0.8144, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0480, loss: 0.8244, batch_reg_loss: 0.2017, reg_loss: 0.2012 ||:  85%|########5 | 81/95 [00:49<00:09,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9405, LAS: 0.8894, UEM: 0.5521, LEM: 0.3079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7789, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9885, loss: 0.8224, batch_reg_loss: 0.2018, reg_loss: 0.2013 ||:  89%|########9 | 85/95 [00:51<00:06,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9407, LAS: 0.8896, UEM: 0.5525, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2857, partial_loss/deprel_loss: 0.4783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6416, loss: 0.8202, batch_reg_loss: 0.2018, reg_loss: 0.2013 ||:  94%|#########3| 89/95 [00:54<00:04,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9415, LAS: 0.8907, UEM: 0.5746, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6793, partial_loss/deprel_loss: 0.6564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8628, loss: 0.8122, batch_reg_loss: 0.2019, reg_loss: 0.2013 ||:  97%|#########6| 92/95 [00:57<00:02,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9420, LAS: 0.8913, UEM: 0.5830, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3710, partial_loss/deprel_loss: 0.5733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.8078, batch_reg_loss: 0.2019, reg_loss: 0.2013 ||: 100%|##########| 95/95 [01:00<00:00,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9420, LAS: 0.8913, UEM: 0.5830, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3710, partial_loss/deprel_loss: 0.5733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.8078, batch_reg_loss: 0.2019, reg_loss: 0.2013 ||: 100%|##########| 95/95 [01:00<00:00,  1.58it/s]\n",
+      "2023-04-07 00:32:23,942 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.201  |       N/A\n",
+      "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - UEM                      |     0.583  |       N/A\n",
+      "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - LEM                      |     0.343  |       N/A\n",
+      "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - EM                       |     0.903  |       N/A\n",
+      "2023-04-07 00:32:23,943 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.371  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - UAS                      |     0.942  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.573  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - loss                     |     0.808  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - LAS                      |     0.891  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:32:23,944 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:32:23,945 - INFO - combo.training.trainer - Epoch duration: 0:01:00.117234\n",
+      "2023-04-07 00:32:23,945 - INFO - combo.training.trainer - Estimated training time remaining: 5:44:08\n",
+      "2023-04-07 00:32:23,945 - INFO - allennlp.training.trainer - Epoch 92/399\n",
+      "2023-04-07 00:32:23,946 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:32:23,946 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:32:23,954 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9442, LAS: 0.8960, UEM: 0.5319, LEM: 0.2802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4404, partial_loss/deprel_loss: 0.5520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7316, loss: 0.7707, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||:   4%|4         | 4/95 [00:02<00:59,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9456, LAS: 0.8981, UEM: 0.5816, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1495, partial_loss/deprel_loss: 0.3068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4773, loss: 0.7387, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||:   8%|8         | 8/95 [00:05<00:56,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9471, LAS: 0.9002, UEM: 0.6313, LEM: 0.4217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5522, partial_loss/deprel_loss: 0.6129, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8028, loss: 0.7206, batch_reg_loss: 0.2020, reg_loss: 0.2019 ||:  12%|#1        | 11/95 [00:07<00:55,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9462, LAS: 0.8976, UEM: 0.6210, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3214, partial_loss/deprel_loss: 0.5144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6778, loss: 0.7467, batch_reg_loss: 0.2020, reg_loss: 0.2019 ||:  16%|#5        | 15/95 [00:09<00:52,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9444, LAS: 0.8952, UEM: 0.6189, LEM: 0.3916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3924, partial_loss/deprel_loss: 0.4781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6630, loss: 0.7662, batch_reg_loss: 0.2020, reg_loss: 0.2020 ||:  20%|##        | 19/95 [00:12<00:49,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9434, LAS: 0.8938, UEM: 0.6076, LEM: 0.3793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2709, partial_loss/deprel_loss: 0.4472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6140, loss: 0.7728, batch_reg_loss: 0.2021, reg_loss: 0.2020 ||:  23%|##3       | 22/95 [00:14<00:50,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9412, LAS: 0.8916, UEM: 0.5937, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8600, partial_loss/deprel_loss: 0.7354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9624, loss: 0.7932, batch_reg_loss: 0.2021, reg_loss: 0.2020 ||:  26%|##6       | 25/95 [00:16<00:48,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9422, LAS: 0.8923, UEM: 0.5865, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3595, partial_loss/deprel_loss: 0.4932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6686, loss: 0.7888, batch_reg_loss: 0.2021, reg_loss: 0.2020 ||:  31%|###       | 29/95 [00:21<00:55,  1.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9415, LAS: 0.8919, UEM: 0.5860, LEM: 0.3555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1778, partial_loss/deprel_loss: 0.3281, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.7944, batch_reg_loss: 0.2022, reg_loss: 0.2020 ||:  34%|###3      | 32/95 [00:23<00:50,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9419, LAS: 0.8920, UEM: 0.5921, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1603, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5008, loss: 0.7953, batch_reg_loss: 0.2022, reg_loss: 0.2020 ||:  37%|###6      | 35/95 [00:25<00:46,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8533, UAS: 0.9408, LAS: 0.8909, UEM: 0.5806, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9589, partial_loss/deprel_loss: 0.8305, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0585, loss: 0.8064, batch_reg_loss: 0.2023, reg_loss: 0.2021 ||:  41%|####1     | 39/95 [00:28<00:41,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9423, LAS: 0.8925, UEM: 0.5876, LEM: 0.3544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3185, partial_loss/deprel_loss: 0.5269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6876, loss: 0.7962, batch_reg_loss: 0.2023, reg_loss: 0.2021 ||:  44%|####4     | 42/95 [00:30<00:39,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9592, UAS: 0.9438, LAS: 0.8944, UEM: 0.6200, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0571, partial_loss/deprel_loss: 0.1655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3461, loss: 0.7831, batch_reg_loss: 0.2024, reg_loss: 0.2021 ||:  47%|####7     | 45/95 [00:33<00:39,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8392, UAS: 0.9418, LAS: 0.8922, UEM: 0.6045, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3574, partial_loss/deprel_loss: 0.9085, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2007, loss: 0.8013, batch_reg_loss: 0.2024, reg_loss: 0.2021 ||:  52%|#####1    | 49/95 [00:35<00:32,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9072, UAS: 0.9424, LAS: 0.8929, UEM: 0.6013, LEM: 0.3761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3916, partial_loss/deprel_loss: 0.5326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7068, loss: 0.7964, batch_reg_loss: 0.2024, reg_loss: 0.2021 ||:  55%|#####4    | 52/95 [00:37<00:30,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9412, LAS: 0.8915, UEM: 0.5947, LEM: 0.3675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4025, partial_loss/deprel_loss: 0.5741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7422, loss: 0.8054, batch_reg_loss: 0.2025, reg_loss: 0.2022 ||:  59%|#####8    | 56/95 [00:40<00:27,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9409, LAS: 0.8910, UEM: 0.5882, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6082, partial_loss/deprel_loss: 0.7029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8864, loss: 0.8087, batch_reg_loss: 0.2025, reg_loss: 0.2022 ||:  62%|######2   | 59/95 [00:42<00:25,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9401, LAS: 0.8899, UEM: 0.5841, LEM: 0.3563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2223, partial_loss/deprel_loss: 0.4426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6011, loss: 0.8175, batch_reg_loss: 0.2025, reg_loss: 0.2022 ||:  66%|######6   | 63/95 [00:44<00:21,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9406, LAS: 0.8906, UEM: 0.5872, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2858, partial_loss/deprel_loss: 0.3845, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5674, loss: 0.8137, batch_reg_loss: 0.2026, reg_loss: 0.2022 ||:  71%|#######   | 67/95 [00:47<00:18,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9401, LAS: 0.8899, UEM: 0.5741, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4226, partial_loss/deprel_loss: 0.5250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7072, loss: 0.8188, batch_reg_loss: 0.2027, reg_loss: 0.2022 ||:  76%|#######5  | 72/95 [00:49<00:13,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9407, LAS: 0.8906, UEM: 0.5698, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4196, partial_loss/deprel_loss: 0.5379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7169, loss: 0.8153, batch_reg_loss: 0.2027, reg_loss: 0.2023 ||:  81%|########1 | 77/95 [00:51<00:09,  1.89it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9411, LAS: 0.8912, UEM: 0.5748, LEM: 0.3440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6897, partial_loss/deprel_loss: 0.6689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8758, loss: 0.8105, batch_reg_loss: 0.2028, reg_loss: 0.2023 ||:  85%|########5 | 81/95 [00:54<00:08,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9416, LAS: 0.8918, UEM: 0.5759, LEM: 0.3427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2683, partial_loss/deprel_loss: 0.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6316, loss: 0.8069, batch_reg_loss: 0.2028, reg_loss: 0.2023 ||:  89%|########9 | 85/95 [00:57<00:06,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8029, UAS: 0.9412, LAS: 0.8914, UEM: 0.5784, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7882, partial_loss/deprel_loss: 1.1323, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4663, loss: 0.8093, batch_reg_loss: 0.2028, reg_loss: 0.2023 ||:  94%|#########3| 89/95 [01:00<00:03,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8948, UAS: 0.9421, LAS: 0.8924, UEM: 0.5892, LEM: 0.3514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3949, partial_loss/deprel_loss: 0.5763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7429, loss: 0.8016, batch_reg_loss: 0.2029, reg_loss: 0.2024 ||:  98%|#########7| 93/95 [01:03<00:01,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9421, LAS: 0.8923, UEM: 0.5866, LEM: 0.3486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7543, partial_loss/deprel_loss: 0.7355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9422, loss: 0.8027, batch_reg_loss: 0.2029, reg_loss: 0.2024 ||: 100%|##########| 95/95 [01:04<00:00,  1.46it/s]\n",
+      "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.202  |       N/A\n",
+      "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - UEM                      |     0.587  |       N/A\n",
+      "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - LEM                      |     0.349  |       N/A\n",
+      "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - EM                       |     0.880  |       N/A\n",
+      "2023-04-07 00:33:28,887 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.754  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - UAS                      |     0.942  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.736  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - loss                     |     0.803  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - LAS                      |     0.892  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:33:28,888 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:33:28,889 - INFO - combo.training.trainer - Epoch duration: 0:01:04.943569\n",
+      "2023-04-07 00:33:28,889 - INFO - combo.training.trainer - Estimated training time remaining: 5:42:54\n",
+      "2023-04-07 00:33:28,889 - INFO - allennlp.training.trainer - Epoch 93/399\n",
+      "2023-04-07 00:33:28,889 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:33:28,890 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:33:28,897 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9551, LAS: 0.9079, UEM: 0.6613, LEM: 0.4019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1750, partial_loss/deprel_loss: 0.3460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.6752, batch_reg_loss: 0.2029, reg_loss: 0.2029 ||:   3%|3         | 3/95 [00:02<01:07,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9494, LAS: 0.9022, UEM: 0.5784, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3563, partial_loss/deprel_loss: 0.4778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6564, loss: 0.7243, batch_reg_loss: 0.2029, reg_loss: 0.2029 ||:   6%|6         | 6/95 [00:04<01:07,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9448, LAS: 0.8972, UEM: 0.5689, LEM: 0.3321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1788, partial_loss/deprel_loss: 0.3445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5143, loss: 0.7537, batch_reg_loss: 0.2030, reg_loss: 0.2029 ||:  11%|#         | 10/95 [00:07<01:01,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8584, UAS: 0.9417, LAS: 0.8925, UEM: 0.5342, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0468, partial_loss/deprel_loss: 0.8551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0965, loss: 0.7887, batch_reg_loss: 0.2030, reg_loss: 0.2029 ||:  15%|#4        | 14/95 [00:09<00:56,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9263, UAS: 0.9447, LAS: 0.8960, UEM: 0.5514, LEM: 0.3017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2834, partial_loss/deprel_loss: 0.3764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5609, loss: 0.7672, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||:  18%|#7        | 17/95 [00:11<00:54,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9473, LAS: 0.8985, UEM: 0.5909, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1812, partial_loss/deprel_loss: 0.4431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5937, loss: 0.7474, batch_reg_loss: 0.2031, reg_loss: 0.2030 ||:  21%|##1       | 20/95 [00:14<00:53,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9474, LAS: 0.8990, UEM: 0.5733, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6749, partial_loss/deprel_loss: 0.6347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8458, loss: 0.7480, batch_reg_loss: 0.2031, reg_loss: 0.2030 ||:  24%|##4       | 23/95 [00:16<00:53,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9447, LAS: 0.8957, UEM: 0.5516, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9470, partial_loss/deprel_loss: 0.8236, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0514, loss: 0.7682, batch_reg_loss: 0.2031, reg_loss: 0.2030 ||:  27%|##7       | 26/95 [00:18<00:50,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9424, LAS: 0.8937, UEM: 0.5940, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9548, partial_loss/deprel_loss: 0.8370, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0637, loss: 0.7856, batch_reg_loss: 0.2031, reg_loss: 0.2030 ||:  31%|###       | 29/95 [00:21<00:50,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9420, LAS: 0.8930, UEM: 0.5906, LEM: 0.3642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.4377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6104, loss: 0.7914, batch_reg_loss: 0.2032, reg_loss: 0.2030 ||:  35%|###4      | 33/95 [00:24<00:46,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9439, LAS: 0.8952, UEM: 0.6147, LEM: 0.3827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1416, partial_loss/deprel_loss: 0.3271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4932, loss: 0.7750, batch_reg_loss: 0.2032, reg_loss: 0.2030 ||:  38%|###7      | 36/95 [00:26<00:46,  1.27it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8617, UAS: 0.9413, LAS: 0.8925, UEM: 0.6020, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9797, partial_loss/deprel_loss: 0.7980, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0376, loss: 0.7976, batch_reg_loss: 0.2032, reg_loss: 0.2031 ||:  42%|####2     | 40/95 [00:29<00:41,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9413, LAS: 0.8926, UEM: 0.6014, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4059, partial_loss/deprel_loss: 0.4809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6692, loss: 0.7987, batch_reg_loss: 0.2033, reg_loss: 0.2031 ||:  45%|####5     | 43/95 [00:31<00:38,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9416, LAS: 0.8929, UEM: 0.5940, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3520, partial_loss/deprel_loss: 0.4431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6282, loss: 0.7982, batch_reg_loss: 0.2033, reg_loss: 0.2031 ||:  48%|####8     | 46/95 [00:33<00:36,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9408, LAS: 0.8923, UEM: 0.5932, LEM: 0.3610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5310, partial_loss/deprel_loss: 0.5824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7755, loss: 0.8032, batch_reg_loss: 0.2033, reg_loss: 0.2031 ||:  52%|#####1    | 49/95 [00:35<00:33,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9416, LAS: 0.8931, UEM: 0.5977, LEM: 0.3633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2374, partial_loss/deprel_loss: 0.4133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5815, loss: 0.7971, batch_reg_loss: 0.2034, reg_loss: 0.2031 ||:  55%|#####4    | 52/95 [00:38<00:32,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9422, LAS: 0.8936, UEM: 0.5977, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1901, partial_loss/deprel_loss: 0.3562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5264, loss: 0.7912, batch_reg_loss: 0.2034, reg_loss: 0.2031 ||:  58%|#####7    | 55/95 [00:40<00:30,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9437, LAS: 0.8952, UEM: 0.6204, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2211, partial_loss/deprel_loss: 0.4185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5825, loss: 0.7779, batch_reg_loss: 0.2035, reg_loss: 0.2032 ||:  61%|######1   | 58/95 [00:42<00:27,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9420, LAS: 0.8931, UEM: 0.6115, LEM: 0.3768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2662, partial_loss/deprel_loss: 0.4593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6242, loss: 0.7915, batch_reg_loss: 0.2035, reg_loss: 0.2032 ||:  65%|######5   | 62/95 [00:45<00:23,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9412, LAS: 0.8922, UEM: 0.6038, LEM: 0.3705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3845, partial_loss/deprel_loss: 0.4549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6443, loss: 0.7980, batch_reg_loss: 0.2035, reg_loss: 0.2032 ||:  68%|######8   | 65/95 [00:47<00:21,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9409, LAS: 0.8918, UEM: 0.5969, LEM: 0.3633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2274, partial_loss/deprel_loss: 0.9883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2397, loss: 0.8019, batch_reg_loss: 0.2036, reg_loss: 0.2032 ||:  73%|#######2  | 69/95 [00:49<00:17,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8948, UAS: 0.9411, LAS: 0.8920, UEM: 0.5903, LEM: 0.3565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5339, partial_loss/deprel_loss: 0.5342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7377, loss: 0.7999, batch_reg_loss: 0.2036, reg_loss: 0.2032 ||:  77%|#######6  | 73/95 [00:51<00:13,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.9417, LAS: 0.8925, UEM: 0.5943, LEM: 0.3578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7405, partial_loss/deprel_loss: 0.7185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9266, loss: 0.7955, batch_reg_loss: 0.2037, reg_loss: 0.2033 ||:  81%|########1 | 77/95 [00:55<00:12,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9421, LAS: 0.8926, UEM: 0.5890, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4679, partial_loss/deprel_loss: 0.5708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7539, loss: 0.7955, batch_reg_loss: 0.2037, reg_loss: 0.2033 ||:  85%|########5 | 81/95 [00:57<00:09,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9419, LAS: 0.8923, UEM: 0.5810, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3783, partial_loss/deprel_loss: 0.4980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6778, loss: 0.7979, batch_reg_loss: 0.2037, reg_loss: 0.2033 ||:  89%|########9 | 85/95 [01:00<00:06,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9415, LAS: 0.8918, UEM: 0.5821, LEM: 0.3465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1365, partial_loss/deprel_loss: 0.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4739, loss: 0.8018, batch_reg_loss: 0.2038, reg_loss: 0.2033 ||:  94%|#########3| 89/95 [01:03<00:04,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9416, LAS: 0.8919, UEM: 0.5845, LEM: 0.3482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1603, partial_loss/deprel_loss: 0.3629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5262, loss: 0.8018, batch_reg_loss: 0.2038, reg_loss: 0.2033 ||:  98%|#########7| 93/95 [01:05<00:01,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9416, LAS: 0.8919, UEM: 0.5828, LEM: 0.3457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4139, partial_loss/deprel_loss: 0.4960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6835, loss: 0.8025, batch_reg_loss: 0.2038, reg_loss: 0.2033 ||: 100%|##########| 95/95 [01:06<00:00,  1.42it/s]\n",
+      "2023-04-07 00:34:35,742 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:34:35,742 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.203  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - UEM                      |     0.583  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - LEM                      |     0.346  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - EM                       |     0.910  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.414  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - UAS                      |     0.942  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.496  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - loss                     |     0.802  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - LAS                      |     0.892  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:34:35,743 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:34:35,744 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:34:35,744 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:34:35,744 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:34:35,744 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:34:35,744 - INFO - combo.training.trainer - Epoch duration: 0:01:06.855109\n",
+      "2023-04-07 00:34:35,744 - INFO - combo.training.trainer - Estimated training time remaining: 5:41:47\n",
+      "2023-04-07 00:34:35,745 - INFO - allennlp.training.trainer - Epoch 94/399\n",
+      "2023-04-07 00:34:35,745 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:34:35,745 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:34:35,753 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9148, UAS: 0.9513, LAS: 0.9046, UEM: 0.5646, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3975, partial_loss/deprel_loss: 0.4403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6356, loss: 0.7113, batch_reg_loss: 0.2039, reg_loss: 0.2039 ||:   4%|4         | 4/95 [00:02<00:47,  1.91it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9367, LAS: 0.8890, UEM: 0.4240, LEM: 0.2018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1801, partial_loss/deprel_loss: 0.8011, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0808, loss: 0.8297, batch_reg_loss: 0.2040, reg_loss: 0.2039 ||:   9%|9         | 9/95 [00:04<00:43,  1.98it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9369, LAS: 0.8891, UEM: 0.4268, LEM: 0.2037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7108, partial_loss/deprel_loss: 0.7335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9330, loss: 0.8324, batch_reg_loss: 0.2040, reg_loss: 0.2039 ||:  15%|#4        | 14/95 [00:06<00:40,  2.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9375, LAS: 0.8899, UEM: 0.4594, LEM: 0.2311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4623, partial_loss/deprel_loss: 0.4910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6893, loss: 0.8311, batch_reg_loss: 0.2041, reg_loss: 0.2040 ||:  20%|##        | 19/95 [00:09<00:36,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9387, LAS: 0.8913, UEM: 0.4626, LEM: 0.2315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7904, partial_loss/deprel_loss: 0.7270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9438, loss: 0.8208, batch_reg_loss: 0.2041, reg_loss: 0.2040 ||:  24%|##4       | 23/95 [00:11<00:39,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9386, LAS: 0.8912, UEM: 0.4765, LEM: 0.2432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2933, partial_loss/deprel_loss: 0.4570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6284, loss: 0.8215, batch_reg_loss: 0.2042, reg_loss: 0.2040 ||:  28%|##8       | 27/95 [00:15<00:42,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9376, LAS: 0.8897, UEM: 0.4675, LEM: 0.2369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4014, partial_loss/deprel_loss: 0.5172, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6982, loss: 0.8359, batch_reg_loss: 0.2042, reg_loss: 0.2040 ||:  32%|###1      | 30/95 [00:17<00:44,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9386, LAS: 0.8901, UEM: 0.4836, LEM: 0.2459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9247, partial_loss/deprel_loss: 0.8234, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0479, loss: 0.8314, batch_reg_loss: 0.2043, reg_loss: 0.2041 ||:  35%|###4      | 33/95 [00:19<00:43,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9388, LAS: 0.8902, UEM: 0.4774, LEM: 0.2380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5193, partial_loss/deprel_loss: 0.5783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7708, loss: 0.8284, batch_reg_loss: 0.2043, reg_loss: 0.2041 ||:  38%|###7      | 36/95 [00:21<00:41,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9017, UAS: 0.9411, LAS: 0.8928, UEM: 0.5396, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4171, partial_loss/deprel_loss: 0.5062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.8082, batch_reg_loss: 0.2043, reg_loss: 0.2041 ||:  41%|####1     | 39/95 [00:24<00:41,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9422, LAS: 0.8936, UEM: 0.5387, LEM: 0.3054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3443, partial_loss/deprel_loss: 0.4676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6473, loss: 0.7998, batch_reg_loss: 0.2044, reg_loss: 0.2041 ||:  45%|####5     | 43/95 [00:26<00:36,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9431, LAS: 0.8946, UEM: 0.5445, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2948, partial_loss/deprel_loss: 0.4587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6303, loss: 0.7902, batch_reg_loss: 0.2044, reg_loss: 0.2041 ||:  48%|####8     | 46/95 [00:28<00:33,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9439, LAS: 0.8954, UEM: 0.5561, LEM: 0.3143, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2306, partial_loss/deprel_loss: 0.3991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5699, loss: 0.7827, batch_reg_loss: 0.2044, reg_loss: 0.2042 ||:  52%|#####1    | 49/95 [00:31<00:33,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9432, LAS: 0.8948, UEM: 0.5649, LEM: 0.3245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8301, partial_loss/deprel_loss: 0.9899, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3624, loss: 0.7852, batch_reg_loss: 0.2044, reg_loss: 0.2042 ||:  55%|#####4    | 52/95 [00:33<00:31,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8069, UAS: 0.9416, LAS: 0.8934, UEM: 0.5631, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8940, partial_loss/deprel_loss: 1.1273, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4851, loss: 0.7968, batch_reg_loss: 0.2045, reg_loss: 0.2042 ||:  59%|#####8    | 56/95 [00:36<00:27,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9414, LAS: 0.8927, UEM: 0.5574, LEM: 0.3150, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4748, partial_loss/deprel_loss: 0.5441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.8009, batch_reg_loss: 0.2045, reg_loss: 0.2042 ||:  62%|######2   | 59/95 [00:38<00:25,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9412, LAS: 0.8925, UEM: 0.5639, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1639, partial_loss/deprel_loss: 0.3403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5095, loss: 0.8021, batch_reg_loss: 0.2045, reg_loss: 0.2042 ||:  65%|######5   | 62/95 [00:40<00:23,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8751, UAS: 0.9414, LAS: 0.8924, UEM: 0.5631, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6976, partial_loss/deprel_loss: 0.7252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9242, loss: 0.8013, batch_reg_loss: 0.2046, reg_loss: 0.2042 ||:  68%|######8   | 65/95 [00:42<00:21,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9421, LAS: 0.8934, UEM: 0.5750, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2649, partial_loss/deprel_loss: 0.3962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5746, loss: 0.7934, batch_reg_loss: 0.2046, reg_loss: 0.2043 ||:  72%|#######1  | 68/95 [00:44<00:19,  1.37it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9427, LAS: 0.8940, UEM: 0.5783, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7786, partial_loss/deprel_loss: 0.6708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8970, loss: 0.7895, batch_reg_loss: 0.2046, reg_loss: 0.2043 ||:  76%|#######5  | 72/95 [00:47<00:16,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8442, UAS: 0.9425, LAS: 0.8938, UEM: 0.5854, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0491, partial_loss/deprel_loss: 0.8937, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1294, loss: 0.7899, batch_reg_loss: 0.2047, reg_loss: 0.2043 ||:  79%|#######8  | 75/95 [00:49<00:14,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9426, LAS: 0.8938, UEM: 0.5852, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2761, partial_loss/deprel_loss: 0.4332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6065, loss: 0.7891, batch_reg_loss: 0.2047, reg_loss: 0.2043 ||:  83%|########3 | 79/95 [00:52<00:11,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9423, LAS: 0.8934, UEM: 0.5851, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6654, partial_loss/deprel_loss: 0.6460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8547, loss: 0.7922, batch_reg_loss: 0.2048, reg_loss: 0.2043 ||:  86%|########6 | 82/95 [00:54<00:09,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9428, LAS: 0.8939, UEM: 0.5892, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5734, partial_loss/deprel_loss: 0.6591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8468, loss: 0.7884, batch_reg_loss: 0.2048, reg_loss: 0.2043 ||:  89%|########9 | 85/95 [00:56<00:07,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9427, LAS: 0.8937, UEM: 0.5876, LEM: 0.3491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1283, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4860, loss: 0.7909, batch_reg_loss: 0.2048, reg_loss: 0.2044 ||:  94%|#########3| 89/95 [00:59<00:04,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9421, LAS: 0.8930, UEM: 0.5862, LEM: 0.3484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1924, partial_loss/deprel_loss: 0.3718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5408, loss: 0.7960, batch_reg_loss: 0.2049, reg_loss: 0.2044 ||:  98%|#########7| 93/95 [01:01<00:01,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9426, LAS: 0.8934, UEM: 0.5887, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2714, partial_loss/deprel_loss: 0.4715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6364, loss: 0.7931, batch_reg_loss: 0.2049, reg_loss: 0.2044 ||: 100%|##########| 95/95 [01:03<00:00,  1.50it/s]\n",
+      "2023-04-07 00:35:38,887 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:35:38,887 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:35:38,887 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.204  |       N/A\n",
+      "2023-04-07 00:35:38,887 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - UEM                      |     0.589  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - LEM                      |     0.348  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - EM                       |     0.915  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.271  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - UAS                      |     0.943  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.471  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - loss                     |     0.793  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - LAS                      |     0.893  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:35:38,888 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:35:38,889 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:35:38,889 - INFO - combo.training.trainer - Epoch duration: 0:01:03.144660\n",
+      "2023-04-07 00:35:38,889 - INFO - combo.training.trainer - Estimated training time remaining: 5:40:27\n",
+      "2023-04-07 00:35:38,889 - INFO - allennlp.training.trainer - Epoch 95/399\n",
+      "2023-04-07 00:35:38,890 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:35:38,890 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:35:38,897 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8799, UAS: 0.9242, LAS: 0.8762, UEM: 0.2850, LEM: 0.0992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8615, partial_loss/deprel_loss: 0.7358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9659, loss: 0.9411, batch_reg_loss: 0.2049, reg_loss: 0.2049 ||:   4%|4         | 4/95 [00:02<00:58,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9353, LAS: 0.8858, UEM: 0.3636, LEM: 0.1408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4285, partial_loss/deprel_loss: 0.5383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7213, loss: 0.8561, batch_reg_loss: 0.2050, reg_loss: 0.2049 ||:   8%|8         | 8/95 [00:05<00:56,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9352, LAS: 0.8868, UEM: 0.3439, LEM: 0.1287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6405, partial_loss/deprel_loss: 0.6543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8566, loss: 0.8527, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||:  13%|#2        | 12/95 [00:07<00:53,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9419, LAS: 0.8933, UEM: 0.4871, LEM: 0.2392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4230, partial_loss/deprel_loss: 0.5419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7232, loss: 0.7997, batch_reg_loss: 0.2051, reg_loss: 0.2050 ||:  16%|#5        | 15/95 [00:10<00:54,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9448, LAS: 0.8961, UEM: 0.5225, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.6213, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8153, loss: 0.7767, batch_reg_loss: 0.2051, reg_loss: 0.2050 ||:  20%|##        | 19/95 [00:12<00:50,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9486, LAS: 0.9009, UEM: 0.6363, LEM: 0.4029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2845, partial_loss/deprel_loss: 0.4368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6115, loss: 0.7372, batch_reg_loss: 0.2051, reg_loss: 0.2050 ||:  23%|##3       | 22/95 [00:15<00:55,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9464, LAS: 0.8982, UEM: 0.6087, LEM: 0.3770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9626, partial_loss/deprel_loss: 0.7642, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0090, loss: 0.7555, batch_reg_loss: 0.2052, reg_loss: 0.2050 ||:  27%|##7       | 26/95 [00:17<00:49,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9468, LAS: 0.8986, UEM: 0.6059, LEM: 0.3733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2224, partial_loss/deprel_loss: 0.4072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5754, loss: 0.7529, batch_reg_loss: 0.2052, reg_loss: 0.2050 ||:  31%|###       | 29/95 [00:20<00:47,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9478, LAS: 0.8997, UEM: 0.6138, LEM: 0.3754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2597, partial_loss/deprel_loss: 0.3947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.7434, batch_reg_loss: 0.2052, reg_loss: 0.2051 ||:  34%|###3      | 32/95 [00:22<00:44,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9495, LAS: 0.9011, UEM: 0.6279, LEM: 0.3809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3057, partial_loss/deprel_loss: 0.5072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6721, loss: 0.7326, batch_reg_loss: 0.2052, reg_loss: 0.2051 ||:  37%|###6      | 35/95 [00:24<00:42,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8034, UAS: 0.9477, LAS: 0.8993, UEM: 0.6249, LEM: 0.3763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0380, partial_loss/deprel_loss: 1.1467, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5302, loss: 0.7497, batch_reg_loss: 0.2053, reg_loss: 0.2051 ||:  41%|####1     | 39/95 [00:26<00:36,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9494, LAS: 0.9009, UEM: 0.6406, LEM: 0.3918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3377, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6790, loss: 0.7387, batch_reg_loss: 0.2053, reg_loss: 0.2051 ||:  46%|####6     | 44/95 [00:28<00:30,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8523, UAS: 0.9472, LAS: 0.8982, UEM: 0.6176, LEM: 0.3726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9144, partial_loss/deprel_loss: 0.7901, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0203, loss: 0.7603, batch_reg_loss: 0.2053, reg_loss: 0.2051 ||:  52%|#####1    | 49/95 [00:30<00:25,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9459, LAS: 0.8968, UEM: 0.6143, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.3803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5569, loss: 0.7709, batch_reg_loss: 0.2054, reg_loss: 0.2052 ||:  57%|#####6    | 54/95 [00:33<00:22,  1.86it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9452, LAS: 0.8961, UEM: 0.6056, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3120, partial_loss/deprel_loss: 0.4476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6259, loss: 0.7803, batch_reg_loss: 0.2054, reg_loss: 0.2052 ||:  61%|######1   | 58/95 [00:36<00:22,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8185, UAS: 0.9436, LAS: 0.8946, UEM: 0.5940, LEM: 0.3539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5388, partial_loss/deprel_loss: 0.9766, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2945, loss: 0.7898, batch_reg_loss: 0.2055, reg_loss: 0.2052 ||:  65%|######5   | 62/95 [00:39<00:21,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9433, LAS: 0.8943, UEM: 0.6019, LEM: 0.3633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1397, partial_loss/deprel_loss: 0.3211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4903, loss: 0.7921, batch_reg_loss: 0.2055, reg_loss: 0.2052 ||:  69%|######9   | 66/95 [00:42<00:20,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9036, UAS: 0.9427, LAS: 0.8936, UEM: 0.5969, LEM: 0.3575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3676, partial_loss/deprel_loss: 0.5613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7281, loss: 0.7958, batch_reg_loss: 0.2056, reg_loss: 0.2052 ||:  74%|#######3  | 70/95 [00:45<00:16,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9272, UAS: 0.9431, LAS: 0.8940, UEM: 0.5940, LEM: 0.3524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2323, partial_loss/deprel_loss: 0.4260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5929, loss: 0.7930, batch_reg_loss: 0.2056, reg_loss: 0.2052 ||:  78%|#######7  | 74/95 [00:47<00:13,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8280, UAS: 0.9425, LAS: 0.8933, UEM: 0.5922, LEM: 0.3492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3858, partial_loss/deprel_loss: 1.0559, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3275, loss: 0.7993, batch_reg_loss: 0.2057, reg_loss: 0.2053 ||:  82%|########2 | 78/95 [00:50<00:11,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9417, LAS: 0.8922, UEM: 0.5842, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0717, partial_loss/deprel_loss: 0.8968, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1375, loss: 0.8070, batch_reg_loss: 0.2057, reg_loss: 0.2053 ||:  86%|########6 | 82/95 [00:52<00:08,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9414, LAS: 0.8918, UEM: 0.5776, LEM: 0.3366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8504, partial_loss/deprel_loss: 0.7947, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0116, loss: 0.8100, batch_reg_loss: 0.2058, reg_loss: 0.2053 ||:  91%|######### | 86/95 [00:55<00:05,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9421, LAS: 0.8925, UEM: 0.5823, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3176, partial_loss/deprel_loss: 0.3931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.8046, batch_reg_loss: 0.2058, reg_loss: 0.2053 ||:  95%|#########4| 90/95 [00:58<00:03,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9418, LAS: 0.8923, UEM: 0.5858, LEM: 0.3442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3271, partial_loss/deprel_loss: 0.5019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6728, loss: 0.8063, batch_reg_loss: 0.2059, reg_loss: 0.2054 ||:  99%|#########8| 94/95 [01:01<00:00,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9420, LAS: 0.8924, UEM: 0.5895, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3248, partial_loss/deprel_loss: 0.4186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6058, loss: 0.8041, batch_reg_loss: 0.2059, reg_loss: 0.2054 ||: 100%|##########| 95/95 [01:02<00:00,  1.53it/s]\n",
+      "2023-04-07 00:36:41,183 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9553, LAS: 0.9034, UEM: 0.7548, LEM: 0.4632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1291, partial_loss/deprel_loss: 40.7917, partial_loss/cycle_loss: 0.0000, batch_loss: 32.8592, loss: 22.6777, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:10,  1.15s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9617, LAS: 0.9134, UEM: 0.7913, LEM: 0.5315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1664, partial_loss/deprel_loss: 8.7585, partial_loss/cycle_loss: 0.0000, batch_loss: 7.0401, loss: 16.5296, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:05<00:06,  1.10s/it]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8689, UAS: 0.9586, LAS: 0.9074, UEM: 0.7498, LEM: 0.4686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0857, partial_loss/deprel_loss: 36.9741, partial_loss/cycle_loss: 0.0000, batch_loss: 29.7964, loss: 18.5827, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:08<00:03,  1.05s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9500, LAS: 0.8971, UEM: 0.6831, LEM: 0.4110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5525, partial_loss/deprel_loss: 46.8248, partial_loss/cycle_loss: 0.0000, batch_loss: 37.7703, loss: 20.8966, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:11<00:00,  1.05s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9500, LAS: 0.8971, UEM: 0.6831, LEM: 0.4110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5525, partial_loss/deprel_loss: 46.8248, partial_loss/cycle_loss: 0.0000, batch_loss: 37.7703, loss: 20.8966, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:11<00:00,  1.02s/it]\n",
+      "2023-04-07 00:36:52,373 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:36:52,373 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.205  |     0.000\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - UEM                      |     0.589  |     0.683\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - LEM                      |     0.348  |     0.411\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - EM                       |     0.909  |     0.849\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.325  |     1.552\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - UAS                      |     0.942  |     0.950\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.419  |    46.825\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - loss                     |     0.804  |    20.897\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - LAS                      |     0.892  |     0.897\n",
+      "2023-04-07 00:36:52,374 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:36:52,375 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:36:52,375 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:36:52,375 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:36:52,375 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:36:52,375 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:36:52,375 - INFO - combo.training.trainer - Epoch duration: 0:01:13.485998\n",
+      "2023-04-07 00:36:52,376 - INFO - combo.training.trainer - Estimated training time remaining: 5:39:41\n",
+      "2023-04-07 00:36:52,376 - INFO - allennlp.training.trainer - Epoch 96/399\n",
+      "2023-04-07 00:36:52,376 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:36:52,376 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:36:52,383 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8639, UAS: 0.9413, LAS: 0.8866, UEM: 0.4235, LEM: 0.1511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9159, partial_loss/deprel_loss: 0.7699, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0051, loss: 0.8340, batch_reg_loss: 0.2059, reg_loss: 0.2059 ||:   4%|4         | 4/95 [00:02<00:57,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9493, LAS: 0.8960, UEM: 0.4964, LEM: 0.1846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3313, partial_loss/deprel_loss: 0.4901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6643, loss: 0.7739, batch_reg_loss: 0.2060, reg_loss: 0.2059 ||:   8%|8         | 8/95 [00:05<00:54,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9466, LAS: 0.8944, UEM: 0.5602, LEM: 0.2649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2165, partial_loss/deprel_loss: 0.3485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5281, loss: 0.7727, batch_reg_loss: 0.2060, reg_loss: 0.2060 ||:  12%|#1        | 11/95 [00:07<00:56,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9620, UAS: 0.9500, LAS: 0.8998, UEM: 0.6595, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0433, partial_loss/deprel_loss: 0.1511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3356, loss: 0.7380, batch_reg_loss: 0.2060, reg_loss: 0.2060 ||:  15%|#4        | 14/95 [00:10<00:59,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9471, LAS: 0.8967, UEM: 0.6291, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3546, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6230, loss: 0.7544, batch_reg_loss: 0.2061, reg_loss: 0.2060 ||:  19%|#8        | 18/95 [00:12<00:52,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9463, LAS: 0.8958, UEM: 0.6229, LEM: 0.3779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2154, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5367, loss: 0.7659, batch_reg_loss: 0.2061, reg_loss: 0.2060 ||:  23%|##3       | 22/95 [00:14<00:49,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9458, LAS: 0.8956, UEM: 0.6195, LEM: 0.3767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4023, partial_loss/deprel_loss: 0.5209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7033, loss: 0.7639, batch_reg_loss: 0.2061, reg_loss: 0.2060 ||:  26%|##6       | 25/95 [00:17<00:48,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9280, UAS: 0.9459, LAS: 0.8957, UEM: 0.6239, LEM: 0.3779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2624, partial_loss/deprel_loss: 0.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5298, loss: 0.7614, batch_reg_loss: 0.2061, reg_loss: 0.2060 ||:  29%|##9       | 28/95 [00:19<00:46,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9443, LAS: 0.8943, UEM: 0.6144, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1972, partial_loss/deprel_loss: 0.3533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5282, loss: 0.7762, batch_reg_loss: 0.2062, reg_loss: 0.2060 ||:  34%|###3      | 32/95 [00:22<00:43,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9448, LAS: 0.8948, UEM: 0.6088, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7992, partial_loss/deprel_loss: 0.7865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9952, loss: 0.7765, batch_reg_loss: 0.2062, reg_loss: 0.2061 ||:  38%|###7      | 36/95 [00:24<00:39,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9458, LAS: 0.8959, UEM: 0.6143, LEM: 0.3668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2885, partial_loss/deprel_loss: 0.4762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6449, loss: 0.7664, batch_reg_loss: 0.2063, reg_loss: 0.2061 ||:  41%|####1     | 39/95 [00:27<00:42,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9465, LAS: 0.8968, UEM: 0.6353, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1215, partial_loss/deprel_loss: 0.2574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4366, loss: 0.7600, batch_reg_loss: 0.2063, reg_loss: 0.2061 ||:  44%|####4     | 42/95 [00:29<00:39,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8433, UAS: 0.9437, LAS: 0.8938, UEM: 0.6203, LEM: 0.3796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2840, partial_loss/deprel_loss: 0.8396, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1348, loss: 0.7827, batch_reg_loss: 0.2063, reg_loss: 0.2061 ||:  48%|####8     | 46/95 [00:32<00:35,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9449, LAS: 0.8952, UEM: 0.6273, LEM: 0.3820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2722, partial_loss/deprel_loss: 0.4272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6025, loss: 0.7730, batch_reg_loss: 0.2064, reg_loss: 0.2061 ||:  52%|#####1    | 49/95 [00:34<00:34,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9463, LAS: 0.8967, UEM: 0.6405, LEM: 0.3941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4555, partial_loss/deprel_loss: 0.5259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7182, loss: 0.7622, batch_reg_loss: 0.2064, reg_loss: 0.2061 ||:  56%|#####5    | 53/95 [00:36<00:28,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9452, LAS: 0.8955, UEM: 0.6223, LEM: 0.3794, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4067, partial_loss/deprel_loss: 0.5368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7172, loss: 0.7743, batch_reg_loss: 0.2064, reg_loss: 0.2062 ||:  61%|######1   | 58/95 [00:39<00:22,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9459, LAS: 0.8959, UEM: 0.6254, LEM: 0.3805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2003, partial_loss/deprel_loss: 0.3466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5238, loss: 0.7719, batch_reg_loss: 0.2065, reg_loss: 0.2062 ||:  65%|######5   | 62/95 [00:41<00:19,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9453, LAS: 0.8955, UEM: 0.6218, LEM: 0.3792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1490, partial_loss/deprel_loss: 0.3464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5134, loss: 0.7788, batch_reg_loss: 0.2065, reg_loss: 0.2062 ||:  69%|######9   | 66/95 [00:43<00:16,  1.77it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9442, LAS: 0.8941, UEM: 0.6146, LEM: 0.3722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3394, partial_loss/deprel_loss: 0.5111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6833, loss: 0.7902, batch_reg_loss: 0.2066, reg_loss: 0.2062 ||:  74%|#######3  | 70/95 [00:45<00:13,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9428, LAS: 0.8925, UEM: 0.6090, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2194, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5969, loss: 0.8012, batch_reg_loss: 0.2066, reg_loss: 0.2062 ||:  78%|#######7  | 74/95 [00:48<00:12,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9431, LAS: 0.8928, UEM: 0.6043, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7139, partial_loss/deprel_loss: 0.7457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9460, loss: 0.7995, batch_reg_loss: 0.2067, reg_loss: 0.2063 ||:  82%|########2 | 78/95 [00:51<00:11,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9426, LAS: 0.8923, UEM: 0.6025, LEM: 0.3565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3274, partial_loss/deprel_loss: 0.4576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6383, loss: 0.8013, batch_reg_loss: 0.2067, reg_loss: 0.2063 ||:  86%|########6 | 82/95 [00:53<00:08,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8730, UAS: 0.9425, LAS: 0.8922, UEM: 0.5929, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6534, partial_loss/deprel_loss: 0.8070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9830, loss: 0.8033, batch_reg_loss: 0.2068, reg_loss: 0.2063 ||:  91%|######### | 86/95 [00:56<00:06,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9428, LAS: 0.8924, UEM: 0.5966, LEM: 0.3514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4715, partial_loss/deprel_loss: 0.5699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7570, loss: 0.8010, batch_reg_loss: 0.2068, reg_loss: 0.2063 ||:  95%|#########4| 90/95 [00:59<00:03,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9426, LAS: 0.8921, UEM: 0.5884, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9063, partial_loss/deprel_loss: 0.7899, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0201, loss: 0.8040, batch_reg_loss: 0.2069, reg_loss: 0.2064 ||:  99%|#########8| 94/95 [01:02<00:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9429, LAS: 0.8924, UEM: 0.5906, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2550, partial_loss/deprel_loss: 0.4591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6251, loss: 0.8021, batch_reg_loss: 0.2069, reg_loss: 0.2064 ||: 100%|##########| 95/95 [01:02<00:00,  1.51it/s]\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.206  |       N/A\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - UEM                      |     0.591  |       N/A\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - LEM                      |     0.345  |       N/A\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - EM                       |     0.920  |       N/A\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.255  |       N/A\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:37:55,219 - INFO - combo.training.tensorboard_writer - UAS                      |     0.943  |       N/A\n",
+      "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.459  |       N/A\n",
+      "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - loss                     |     0.802  |       N/A\n",
+      "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - LAS                      |     0.892  |       N/A\n",
+      "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:37:55,220 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:37:55,221 - INFO - combo.training.trainer - Epoch duration: 0:01:02.845131\n",
+      "2023-04-07 00:37:55,221 - INFO - combo.training.trainer - Estimated training time remaining: 5:38:21\n",
+      "2023-04-07 00:37:55,221 - INFO - allennlp.training.trainer - Epoch 97/399\n",
+      "2023-04-07 00:37:55,221 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:37:55,222 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:37:55,228 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9419, LAS: 0.8920, UEM: 0.3952, LEM: 0.1597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6851, partial_loss/deprel_loss: 0.6447, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8597, loss: 0.8136, batch_reg_loss: 0.2069, reg_loss: 0.2069 ||:   4%|4         | 4/95 [00:02<00:58,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9512, LAS: 0.9010, UEM: 0.5581, LEM: 0.2760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2635, partial_loss/deprel_loss: 0.4261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6006, loss: 0.7490, batch_reg_loss: 0.2070, reg_loss: 0.2069 ||:   8%|8         | 8/95 [00:05<00:57,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9556, LAS: 0.9075, UEM: 0.6934, LEM: 0.4679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1694, partial_loss/deprel_loss: 0.3743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5404, loss: 0.7027, batch_reg_loss: 0.2070, reg_loss: 0.2070 ||:  12%|#1        | 11/95 [00:07<00:59,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9558, LAS: 0.9078, UEM: 0.6931, LEM: 0.4594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1622, partial_loss/deprel_loss: 0.3335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5062, loss: 0.6936, batch_reg_loss: 0.2070, reg_loss: 0.2070 ||:  15%|#4        | 14/95 [00:09<00:57,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9506, LAS: 0.9026, UEM: 0.6768, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4128, partial_loss/deprel_loss: 0.5209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7064, loss: 0.7229, batch_reg_loss: 0.2071, reg_loss: 0.2070 ||:  19%|#8        | 18/95 [00:12<00:53,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9455, LAS: 0.8965, UEM: 0.6393, LEM: 0.4103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4682, partial_loss/deprel_loss: 0.5416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7340, loss: 0.7679, batch_reg_loss: 0.2071, reg_loss: 0.2070 ||:  23%|##3       | 22/95 [00:14<00:48,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9432, LAS: 0.8937, UEM: 0.6066, LEM: 0.3802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7097, partial_loss/deprel_loss: 0.6215, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8462, loss: 0.7868, batch_reg_loss: 0.2071, reg_loss: 0.2070 ||:  27%|##7       | 26/95 [00:17<00:44,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9442, LAS: 0.8947, UEM: 0.6040, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5019, partial_loss/deprel_loss: 0.5566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7528, loss: 0.7828, batch_reg_loss: 0.2072, reg_loss: 0.2070 ||:  31%|###       | 29/95 [00:19<00:46,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9453, LAS: 0.8959, UEM: 0.6047, LEM: 0.3694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2139, partial_loss/deprel_loss: 0.4008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5707, loss: 0.7728, batch_reg_loss: 0.2072, reg_loss: 0.2071 ||:  34%|###3      | 32/95 [00:21<00:43,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9460, LAS: 0.8969, UEM: 0.6114, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1764, partial_loss/deprel_loss: 0.4010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5633, loss: 0.7677, batch_reg_loss: 0.2072, reg_loss: 0.2071 ||:  37%|###6      | 35/95 [00:24<00:41,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8802, UAS: 0.9461, LAS: 0.8968, UEM: 0.6037, LEM: 0.3620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6509, partial_loss/deprel_loss: 0.7461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9344, loss: 0.7692, batch_reg_loss: 0.2073, reg_loss: 0.2071 ||:  40%|####      | 38/95 [00:26<00:39,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9477, LAS: 0.8984, UEM: 0.6260, LEM: 0.3804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3298, partial_loss/deprel_loss: 0.3937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5882, loss: 0.7543, batch_reg_loss: 0.2073, reg_loss: 0.2071 ||:  43%|####3     | 41/95 [00:28<00:38,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9481, LAS: 0.8990, UEM: 0.6309, LEM: 0.3845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1242, partial_loss/deprel_loss: 0.2849, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4601, loss: 0.7516, batch_reg_loss: 0.2073, reg_loss: 0.2071 ||:  47%|####7     | 45/95 [00:31<00:35,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9477, LAS: 0.8984, UEM: 0.6278, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2397, partial_loss/deprel_loss: 0.3821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5610, loss: 0.7560, batch_reg_loss: 0.2073, reg_loss: 0.2071 ||:  51%|#####     | 48/95 [00:33<00:34,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9461, LAS: 0.8966, UEM: 0.6145, LEM: 0.3716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7759, partial_loss/deprel_loss: 0.7306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9470, loss: 0.7712, batch_reg_loss: 0.2074, reg_loss: 0.2071 ||:  54%|#####3    | 51/95 [00:35<00:31,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9462, LAS: 0.8964, UEM: 0.6060, LEM: 0.3621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5400, partial_loss/deprel_loss: 0.5703, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7716, loss: 0.7712, batch_reg_loss: 0.2074, reg_loss: 0.2072 ||:  58%|#####7    | 55/95 [00:38<00:27,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9458, LAS: 0.8962, UEM: 0.6014, LEM: 0.3579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5700, partial_loss/deprel_loss: 0.6182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8160, loss: 0.7742, batch_reg_loss: 0.2074, reg_loss: 0.2072 ||:  61%|######1   | 58/95 [00:40<00:26,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 0.9459, LAS: 0.8965, UEM: 0.6113, LEM: 0.3727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0668, partial_loss/deprel_loss: 0.8189, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0759, loss: 0.7712, batch_reg_loss: 0.2075, reg_loss: 0.2072 ||:  64%|######4   | 61/95 [00:42<00:24,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9458, LAS: 0.8966, UEM: 0.6046, LEM: 0.3656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8410, partial_loss/deprel_loss: 0.8078, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0220, loss: 0.7762, batch_reg_loss: 0.2075, reg_loss: 0.2072 ||:  68%|######8   | 65/95 [00:45<00:20,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9458, LAS: 0.8967, UEM: 0.6065, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8679, partial_loss/deprel_loss: 0.8099, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0290, loss: 0.7760, batch_reg_loss: 0.2075, reg_loss: 0.2072 ||:  72%|#######1  | 68/95 [00:47<00:19,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9443, LAS: 0.8950, UEM: 0.5978, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9440, partial_loss/deprel_loss: 0.7764, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0175, loss: 0.7895, batch_reg_loss: 0.2076, reg_loss: 0.2072 ||:  75%|#######4  | 71/95 [00:49<00:16,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9446, LAS: 0.8952, UEM: 0.5970, LEM: 0.3585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2569, partial_loss/deprel_loss: 0.4455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6154, loss: 0.7879, batch_reg_loss: 0.2076, reg_loss: 0.2073 ||:  78%|#######7  | 74/95 [00:51<00:14,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9448, LAS: 0.8955, UEM: 0.6005, LEM: 0.3605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2562, partial_loss/deprel_loss: 0.4092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5862, loss: 0.7862, batch_reg_loss: 0.2076, reg_loss: 0.2073 ||:  81%|########1 | 77/95 [00:53<00:12,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9451, LAS: 0.8959, UEM: 0.6014, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2525, partial_loss/deprel_loss: 0.4257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5987, loss: 0.7830, batch_reg_loss: 0.2077, reg_loss: 0.2073 ||:  84%|########4 | 80/95 [00:55<00:10,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8159, UAS: 0.9433, LAS: 0.8938, UEM: 0.5915, LEM: 0.3525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6011, partial_loss/deprel_loss: 0.9215, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2651, loss: 0.7986, batch_reg_loss: 0.2077, reg_loss: 0.2073 ||:  88%|########8 | 84/95 [00:58<00:07,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8293, UAS: 0.9430, LAS: 0.8936, UEM: 0.5878, LEM: 0.3483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4834, partial_loss/deprel_loss: 1.0250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3245, loss: 0.8012, batch_reg_loss: 0.2078, reg_loss: 0.2073 ||:  93%|#########2| 88/95 [01:00<00:04,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8049, UAS: 0.9427, LAS: 0.8933, UEM: 0.5894, LEM: 0.3490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9498, partial_loss/deprel_loss: 1.1388, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5088, loss: 0.8028, batch_reg_loss: 0.2078, reg_loss: 0.2073 ||:  98%|#########7| 93/95 [01:03<00:01,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8831, UAS: 0.9428, LAS: 0.8935, UEM: 0.5891, LEM: 0.3490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7368, partial_loss/deprel_loss: 0.6611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8841, loss: 0.8013, batch_reg_loss: 0.2079, reg_loss: 0.2074 ||: 100%|##########| 95/95 [01:04<00:00,  1.48it/s]\n",
+      "2023-04-07 00:38:59,486 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.207  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - UEM                      |     0.589  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - LEM                      |     0.349  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - EM                       |     0.883  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.737  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - UAS                      |     0.943  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.661  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - loss                     |     0.801  |       N/A\n",
+      "2023-04-07 00:38:59,487 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - LAS                      |     0.894  |       N/A\n",
+      "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:38:59,488 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:38:59,489 - INFO - combo.training.trainer - Epoch duration: 0:01:04.267507\n",
+      "2023-04-07 00:38:59,489 - INFO - combo.training.trainer - Estimated training time remaining: 5:37:05\n",
+      "2023-04-07 00:38:59,489 - INFO - allennlp.training.trainer - Epoch 98/399\n",
+      "2023-04-07 00:38:59,489 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:38:59,489 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:38:59,496 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8261, UAS: 0.9357, LAS: 0.8838, UEM: 0.4643, LEM: 0.2083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4956, partial_loss/deprel_loss: 0.9264, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2482, loss: 0.8428, batch_reg_loss: 0.2079, reg_loss: 0.2079 ||:   4%|4         | 4/95 [00:02<00:51,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9330, LAS: 0.8817, UEM: 0.3829, LEM: 0.1561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6764, partial_loss/deprel_loss: 0.6329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8496, loss: 0.8622, batch_reg_loss: 0.2079, reg_loss: 0.2079 ||:   7%|7         | 7/95 [00:04<00:52,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9588, UAS: 0.9421, LAS: 0.8942, UEM: 0.6039, LEM: 0.4192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0606, partial_loss/deprel_loss: 0.1576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3462, loss: 0.7862, batch_reg_loss: 0.2080, reg_loss: 0.2079 ||:  12%|#1        | 11/95 [00:06<00:51,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9335, LAS: 0.8849, UEM: 0.5404, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6843, partial_loss/deprel_loss: 0.6419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8585, loss: 0.8607, batch_reg_loss: 0.2080, reg_loss: 0.2080 ||:  16%|#5        | 15/95 [00:09<00:49,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9392, LAS: 0.8904, UEM: 0.5790, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3560, partial_loss/deprel_loss: 0.5223, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6972, loss: 0.8190, batch_reg_loss: 0.2081, reg_loss: 0.2080 ||:  20%|##        | 19/95 [00:11<00:46,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9406, LAS: 0.8923, UEM: 0.5903, LEM: 0.3695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4466, partial_loss/deprel_loss: 0.6045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7811, loss: 0.8112, batch_reg_loss: 0.2082, reg_loss: 0.2080 ||:  25%|##5       | 24/95 [00:14<00:40,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9406, LAS: 0.8917, UEM: 0.5703, LEM: 0.3458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3396, partial_loss/deprel_loss: 0.4890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6673, loss: 0.8141, batch_reg_loss: 0.2082, reg_loss: 0.2080 ||:  29%|##9       | 28/95 [00:16<00:37,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9413, LAS: 0.8924, UEM: 0.5910, LEM: 0.3653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2402, partial_loss/deprel_loss: 0.4076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5824, loss: 0.8062, batch_reg_loss: 0.2082, reg_loss: 0.2081 ||:  34%|###3      | 32/95 [00:19<00:37,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9426, LAS: 0.8939, UEM: 0.6176, LEM: 0.3962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5229, partial_loss/deprel_loss: 0.6118, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8023, loss: 0.7957, batch_reg_loss: 0.2083, reg_loss: 0.2081 ||:  38%|###7      | 36/95 [00:22<00:37,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8441, UAS: 0.9405, LAS: 0.8914, UEM: 0.5972, LEM: 0.3772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2203, partial_loss/deprel_loss: 0.8665, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1456, loss: 0.8147, batch_reg_loss: 0.2083, reg_loss: 0.2081 ||:  42%|####2     | 40/95 [00:25<00:36,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9418, LAS: 0.8925, UEM: 0.5959, LEM: 0.3695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4846, partial_loss/deprel_loss: 0.5749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7652, loss: 0.8076, batch_reg_loss: 0.2083, reg_loss: 0.2081 ||:  45%|####5     | 43/95 [00:27<00:37,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9430, LAS: 0.8936, UEM: 0.6003, LEM: 0.3643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2596, partial_loss/deprel_loss: 0.4677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6345, loss: 0.7996, batch_reg_loss: 0.2084, reg_loss: 0.2081 ||:  48%|####8     | 46/95 [00:29<00:34,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9437, LAS: 0.8944, UEM: 0.6065, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6041, partial_loss/deprel_loss: 0.5779, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7916, loss: 0.7918, batch_reg_loss: 0.2084, reg_loss: 0.2081 ||:  52%|#####1    | 49/95 [00:31<00:33,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9444, LAS: 0.8952, UEM: 0.6066, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2550, partial_loss/deprel_loss: 0.4441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.7877, batch_reg_loss: 0.2084, reg_loss: 0.2082 ||:  56%|#####5    | 53/95 [00:34<00:30,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9438, LAS: 0.8943, UEM: 0.5992, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3584, partial_loss/deprel_loss: 0.5268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7016, loss: 0.7940, batch_reg_loss: 0.2085, reg_loss: 0.2082 ||:  59%|#####8    | 56/95 [00:37<00:28,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9423, LAS: 0.8927, UEM: 0.5927, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2788, partial_loss/deprel_loss: 0.4532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6268, loss: 0.8044, batch_reg_loss: 0.2085, reg_loss: 0.2082 ||:  63%|######3   | 60/95 [00:39<00:24,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9423, LAS: 0.8927, UEM: 0.5862, LEM: 0.3456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7276, partial_loss/deprel_loss: 0.7248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9339, loss: 0.8041, batch_reg_loss: 0.2085, reg_loss: 0.2082 ||:  67%|######7   | 64/95 [00:41<00:20,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9426, LAS: 0.8929, UEM: 0.5919, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1745, partial_loss/deprel_loss: 0.3670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5371, loss: 0.8006, batch_reg_loss: 0.2086, reg_loss: 0.2082 ||:  72%|#######1  | 68/95 [00:45<00:18,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9438, LAS: 0.8942, UEM: 0.6073, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1129, partial_loss/deprel_loss: 0.3218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.7909, batch_reg_loss: 0.2086, reg_loss: 0.2083 ||:  75%|#######4  | 71/95 [00:47<00:17,  1.37it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9430, LAS: 0.8932, UEM: 0.5973, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5020, partial_loss/deprel_loss: 0.6178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8033, loss: 0.7991, batch_reg_loss: 0.2086, reg_loss: 0.2083 ||:  79%|#######8  | 75/95 [00:49<00:14,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9435, LAS: 0.8939, UEM: 0.5990, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4111, partial_loss/deprel_loss: 0.5059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6956, loss: 0.7938, batch_reg_loss: 0.2087, reg_loss: 0.2083 ||:  82%|########2 | 78/95 [00:52<00:11,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9432, LAS: 0.8937, UEM: 0.5940, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8354, partial_loss/deprel_loss: 0.7642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9871, loss: 0.7941, batch_reg_loss: 0.2087, reg_loss: 0.2083 ||:  85%|########5 | 81/95 [00:54<00:10,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8602, UAS: 0.9433, LAS: 0.8938, UEM: 0.5930, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9581, partial_loss/deprel_loss: 0.8794, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1039, loss: 0.7942, batch_reg_loss: 0.2087, reg_loss: 0.2083 ||:  88%|########8 | 84/95 [00:56<00:08,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9430, LAS: 0.8934, UEM: 0.5933, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3019, partial_loss/deprel_loss: 0.3971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5868, loss: 0.7963, batch_reg_loss: 0.2087, reg_loss: 0.2083 ||:  92%|#########1| 87/95 [00:58<00:05,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9431, LAS: 0.8936, UEM: 0.5931, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 0.3750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5416, loss: 0.7952, batch_reg_loss: 0.2088, reg_loss: 0.2084 ||:  96%|#########5| 91/95 [01:01<00:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9427, LAS: 0.8931, UEM: 0.5890, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8521, partial_loss/deprel_loss: 0.7966, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0165, loss: 0.7985, batch_reg_loss: 0.2088, reg_loss: 0.2084 ||: 100%|##########| 95/95 [01:04<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9427, LAS: 0.8931, UEM: 0.5890, LEM: 0.3454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8521, partial_loss/deprel_loss: 0.7966, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0165, loss: 0.7985, batch_reg_loss: 0.2088, reg_loss: 0.2084 ||: 100%|##########| 95/95 [01:04<00:00,  1.48it/s]\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.208  |       N/A\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - UEM                      |     0.589  |       N/A\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - LEM                      |     0.345  |       N/A\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - EM                       |     0.862  |       N/A\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.852  |       N/A\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - UAS                      |     0.943  |       N/A\n",
+      "2023-04-07 00:40:03,536 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.797  |       N/A\n",
+      "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - loss                     |     0.799  |       N/A\n",
+      "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - LAS                      |     0.893  |       N/A\n",
+      "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:40:03,537 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:40:03,538 - INFO - combo.training.trainer - Epoch duration: 0:01:04.049029\n",
+      "2023-04-07 00:40:03,538 - INFO - combo.training.trainer - Estimated training time remaining: 5:35:49\n",
+      "2023-04-07 00:40:03,538 - INFO - allennlp.training.trainer - Epoch 99/399\n",
+      "2023-04-07 00:40:03,538 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:40:03,539 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:40:03,546 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8253, UAS: 0.9333, LAS: 0.8825, UEM: 0.5525, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5290, partial_loss/deprel_loss: 0.9262, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2556, loss: 0.8527, batch_reg_loss: 0.2089, reg_loss: 0.2089 ||:   4%|4         | 4/95 [00:02<00:58,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8642, UAS: 0.9410, LAS: 0.8895, UEM: 0.6034, LEM: 0.3393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8687, partial_loss/deprel_loss: 0.8306, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0471, loss: 0.8119, batch_reg_loss: 0.2089, reg_loss: 0.2089 ||:   7%|7         | 7/95 [00:04<01:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9387, LAS: 0.8878, UEM: 0.5300, LEM: 0.2876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5496, partial_loss/deprel_loss: 0.5826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7849, loss: 0.8348, batch_reg_loss: 0.2089, reg_loss: 0.2089 ||:  11%|#         | 10/95 [00:07<00:59,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9403, LAS: 0.8906, UEM: 0.5537, LEM: 0.3095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8904, partial_loss/deprel_loss: 0.6754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9274, loss: 0.8144, batch_reg_loss: 0.2090, reg_loss: 0.2089 ||:  15%|#4        | 14/95 [00:09<00:55,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8571, UAS: 0.9414, LAS: 0.8922, UEM: 0.5599, LEM: 0.3146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0540, partial_loss/deprel_loss: 0.8520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1014, loss: 0.8022, batch_reg_loss: 0.2090, reg_loss: 0.2089 ||:  19%|#8        | 18/95 [00:12<00:51,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9432, LAS: 0.8941, UEM: 0.5652, LEM: 0.3178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3522, partial_loss/deprel_loss: 0.4730, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6578, loss: 0.7904, batch_reg_loss: 0.2090, reg_loss: 0.2089 ||:  22%|##2       | 21/95 [00:14<00:51,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9442, LAS: 0.8951, UEM: 0.5852, LEM: 0.3321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2949, partial_loss/deprel_loss: 0.4758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6487, loss: 0.7812, batch_reg_loss: 0.2091, reg_loss: 0.2090 ||:  25%|##5       | 24/95 [00:16<00:49,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8923, UAS: 0.9427, LAS: 0.8933, UEM: 0.5612, LEM: 0.3138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5461, partial_loss/deprel_loss: 0.6731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8568, loss: 0.7966, batch_reg_loss: 0.2091, reg_loss: 0.2090 ||:  28%|##8       | 27/95 [00:18<00:47,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8621, UAS: 0.9407, LAS: 0.8915, UEM: 0.5802, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1346, partial_loss/deprel_loss: 0.8412, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1090, loss: 0.8129, batch_reg_loss: 0.2091, reg_loss: 0.2090 ||:  32%|###1      | 30/95 [00:20<00:46,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.9411, LAS: 0.8917, UEM: 0.5738, LEM: 0.3303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8135, partial_loss/deprel_loss: 0.7104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9402, loss: 0.8104, batch_reg_loss: 0.2092, reg_loss: 0.2090 ||:  35%|###4      | 33/95 [00:23<00:43,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9415, LAS: 0.8922, UEM: 0.5693, LEM: 0.3282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7584, partial_loss/deprel_loss: 0.7292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9442, loss: 0.8085, batch_reg_loss: 0.2092, reg_loss: 0.2090 ||:  38%|###7      | 36/95 [00:25<00:42,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9415, LAS: 0.8923, UEM: 0.5604, LEM: 0.3206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3089, partial_loss/deprel_loss: 0.4514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6322, loss: 0.8075, batch_reg_loss: 0.2092, reg_loss: 0.2090 ||:  41%|####1     | 39/95 [00:27<00:40,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8806, UAS: 0.9395, LAS: 0.8899, UEM: 0.5407, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7474, partial_loss/deprel_loss: 0.6663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8918, loss: 0.8278, batch_reg_loss: 0.2093, reg_loss: 0.2091 ||:  45%|####5     | 43/95 [00:29<00:35,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9398, LAS: 0.8902, UEM: 0.5434, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5106, partial_loss/deprel_loss: 0.6244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8110, loss: 0.8263, batch_reg_loss: 0.2093, reg_loss: 0.2091 ||:  49%|####9     | 47/95 [00:31<00:30,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9403, LAS: 0.8907, UEM: 0.5577, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4097, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7479, loss: 0.8212, batch_reg_loss: 0.2094, reg_loss: 0.2091 ||:  54%|#####3    | 51/95 [00:33<00:26,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9402, LAS: 0.8905, UEM: 0.5506, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9492, partial_loss/deprel_loss: 0.7954, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0356, loss: 0.8245, batch_reg_loss: 0.2094, reg_loss: 0.2091 ||:  58%|#####7    | 55/95 [00:35<00:22,  1.77it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9418, LAS: 0.8922, UEM: 0.5665, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2009, partial_loss/deprel_loss: 0.4485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6085, loss: 0.8104, batch_reg_loss: 0.2095, reg_loss: 0.2092 ||:  63%|######3   | 60/95 [00:38<00:18,  1.87it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7850, UAS: 0.9407, LAS: 0.8909, UEM: 0.5628, LEM: 0.3217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0868, partial_loss/deprel_loss: 1.1629, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5572, loss: 0.8184, batch_reg_loss: 0.2095, reg_loss: 0.2092 ||:  67%|######7   | 64/95 [00:41<00:18,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9420, LAS: 0.8927, UEM: 0.5980, LEM: 0.3701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5500, partial_loss/deprel_loss: 0.5586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7665, loss: 0.8049, batch_reg_loss: 0.2096, reg_loss: 0.2092 ||:  72%|#######1  | 68/95 [00:44<00:17,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9424, LAS: 0.8931, UEM: 0.5918, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5943, partial_loss/deprel_loss: 0.6195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8240, loss: 0.8010, batch_reg_loss: 0.2096, reg_loss: 0.2092 ||:  76%|#######5  | 72/95 [00:47<00:15,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9425, LAS: 0.8932, UEM: 0.5915, LEM: 0.3590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5636, loss: 0.8016, batch_reg_loss: 0.2097, reg_loss: 0.2092 ||:  80%|########  | 76/95 [00:49<00:12,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9430, LAS: 0.8936, UEM: 0.5961, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3083, partial_loss/deprel_loss: 0.4880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.7945, batch_reg_loss: 0.2097, reg_loss: 0.2093 ||:  84%|########4 | 80/95 [00:52<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9434, LAS: 0.8940, UEM: 0.5974, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4523, partial_loss/deprel_loss: 0.5423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7340, loss: 0.7911, batch_reg_loss: 0.2097, reg_loss: 0.2093 ||:  88%|########8 | 84/95 [00:55<00:07,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8644, UAS: 0.9434, LAS: 0.8940, UEM: 0.5952, LEM: 0.3560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9780, partial_loss/deprel_loss: 0.7898, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0372, loss: 0.7914, batch_reg_loss: 0.2097, reg_loss: 0.2093 ||:  92%|#########1| 87/95 [00:57<00:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8814, UAS: 0.9431, LAS: 0.8936, UEM: 0.5911, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5983, partial_loss/deprel_loss: 0.5760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7902, loss: 0.7939, batch_reg_loss: 0.2098, reg_loss: 0.2093 ||:  95%|#########4| 90/95 [00:59<00:03,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9432, LAS: 0.8937, UEM: 0.5890, LEM: 0.3484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3280, partial_loss/deprel_loss: 0.4128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6056, loss: 0.7929, batch_reg_loss: 0.2098, reg_loss: 0.2093 ||:  98%|#########7| 93/95 [01:01<00:01,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8516, UAS: 0.9429, LAS: 0.8933, UEM: 0.5858, LEM: 0.3452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2694, partial_loss/deprel_loss: 0.8741, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1630, loss: 0.7965, batch_reg_loss: 0.2098, reg_loss: 0.2093 ||: 100%|##########| 95/95 [01:03<00:00,  1.50it/s]\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.209  |       N/A\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - UEM                      |     0.586  |       N/A\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - LEM                      |     0.345  |       N/A\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - EM                       |     0.852  |       N/A\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.269  |       N/A\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:41:06,737 - INFO - combo.training.tensorboard_writer - UAS                      |     0.943  |       N/A\n",
+      "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.874  |       N/A\n",
+      "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - loss                     |     0.796  |       N/A\n",
+      "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - LAS                      |     0.893  |       N/A\n",
+      "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:41:06,738 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:41:06,739 - INFO - combo.training.trainer - Epoch duration: 0:01:03.200859\n",
+      "2023-04-07 00:41:06,739 - INFO - combo.training.trainer - Estimated training time remaining: 5:34:31\n",
+      "2023-04-07 00:41:06,739 - INFO - allennlp.training.trainer - Epoch 100/399\n",
+      "2023-04-07 00:41:06,739 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:41:06,740 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:41:06,760 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8500, UAS: 0.8957, LAS: 0.8423, UEM: 0.0505, LEM: 0.0051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0992, partial_loss/deprel_loss: 0.8315, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0949, loss: 1.1352, batch_reg_loss: 0.2098, reg_loss: 0.2098 ||:   3%|3         | 3/95 [00:02<01:05,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9169, LAS: 0.8659, UEM: 0.5052, LEM: 0.3154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3273, partial_loss/deprel_loss: 0.7813, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1003, loss: 0.9686, batch_reg_loss: 0.2099, reg_loss: 0.2098 ||:   6%|6         | 6/95 [00:04<01:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9282, LAS: 0.8775, UEM: 0.5276, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7433, partial_loss/deprel_loss: 0.7389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9497, loss: 0.8948, batch_reg_loss: 0.2099, reg_loss: 0.2099 ||:  11%|#         | 10/95 [00:06<00:57,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9314, LAS: 0.8817, UEM: 0.5023, LEM: 0.2814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5311, partial_loss/deprel_loss: 0.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7436, loss: 0.8731, batch_reg_loss: 0.2100, reg_loss: 0.2099 ||:  15%|#4        | 14/95 [00:09<00:52,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9361, LAS: 0.8869, UEM: 0.5188, LEM: 0.2836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4068, partial_loss/deprel_loss: 0.4875, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6814, loss: 0.8388, batch_reg_loss: 0.2100, reg_loss: 0.2099 ||:  18%|#7        | 17/95 [00:11<00:51,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.9375, LAS: 0.8890, UEM: 0.5690, LEM: 0.3367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1092, partial_loss/deprel_loss: 0.7372, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0216, loss: 0.8185, batch_reg_loss: 0.2100, reg_loss: 0.2099 ||:  21%|##1       | 20/95 [00:13<00:51,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9375, LAS: 0.8888, UEM: 0.5810, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1757, partial_loss/deprel_loss: 0.3448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5210, loss: 0.8215, batch_reg_loss: 0.2101, reg_loss: 0.2100 ||:  25%|##5       | 24/95 [00:15<00:48,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9397, LAS: 0.8913, UEM: 0.6007, LEM: 0.3634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2510, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.8017, batch_reg_loss: 0.2101, reg_loss: 0.2100 ||:  28%|##8       | 27/95 [00:18<00:49,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9592, UAS: 0.9424, LAS: 0.8944, UEM: 0.6485, LEM: 0.4256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0601, partial_loss/deprel_loss: 0.1583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3488, loss: 0.7807, batch_reg_loss: 0.2101, reg_loss: 0.2100 ||:  32%|###1      | 30/95 [00:21<00:51,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9431, LAS: 0.8954, UEM: 0.6496, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2603, partial_loss/deprel_loss: 0.4238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6013, loss: 0.7749, batch_reg_loss: 0.2102, reg_loss: 0.2100 ||:  35%|###4      | 33/95 [00:23<00:47,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9422, LAS: 0.8947, UEM: 0.6246, LEM: 0.4012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4997, partial_loss/deprel_loss: 0.5338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7372, loss: 0.7804, batch_reg_loss: 0.2102, reg_loss: 0.2100 ||:  39%|###8      | 37/95 [00:25<00:42,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9418, LAS: 0.8939, UEM: 0.6084, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2840, partial_loss/deprel_loss: 0.4502, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6271, loss: 0.7889, batch_reg_loss: 0.2102, reg_loss: 0.2100 ||:  43%|####3     | 41/95 [00:28<00:37,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9417, LAS: 0.8937, UEM: 0.6145, LEM: 0.3926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1120, partial_loss/deprel_loss: 0.3045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4762, loss: 0.7902, batch_reg_loss: 0.2102, reg_loss: 0.2101 ||:  47%|####7     | 45/95 [00:31<00:34,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8940, UAS: 0.9424, LAS: 0.8945, UEM: 0.6130, LEM: 0.3880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5984, partial_loss/deprel_loss: 0.6446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8456, loss: 0.7852, batch_reg_loss: 0.2103, reg_loss: 0.2101 ||:  51%|#####     | 48/95 [00:33<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9436, LAS: 0.8956, UEM: 0.6165, LEM: 0.3840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3159, partial_loss/deprel_loss: 0.4886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6643, loss: 0.7776, batch_reg_loss: 0.2103, reg_loss: 0.2101 ||:  54%|#####3    | 51/95 [00:35<00:30,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9439, LAS: 0.8957, UEM: 0.6090, LEM: 0.3745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6701, partial_loss/deprel_loss: 0.6689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8795, loss: 0.7781, batch_reg_loss: 0.2103, reg_loss: 0.2101 ||:  57%|#####6    | 54/95 [00:37<00:28,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8189, UAS: 0.9428, LAS: 0.8945, UEM: 0.6073, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6892, partial_loss/deprel_loss: 1.0752, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4083, loss: 0.7886, batch_reg_loss: 0.2103, reg_loss: 0.2101 ||:  60%|######    | 57/95 [00:39<00:26,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8767, UAS: 0.9428, LAS: 0.8944, UEM: 0.5981, LEM: 0.3632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0034, partial_loss/deprel_loss: 0.7920, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0447, loss: 0.7907, batch_reg_loss: 0.2104, reg_loss: 0.2101 ||:  64%|######4   | 61/95 [00:42<00:23,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9423, LAS: 0.8939, UEM: 0.5922, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.4997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6782, loss: 0.7958, batch_reg_loss: 0.2104, reg_loss: 0.2101 ||:  68%|######8   | 65/95 [00:44<00:19,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9430, LAS: 0.8946, UEM: 0.5994, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2576, partial_loss/deprel_loss: 0.4229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6003, loss: 0.7904, batch_reg_loss: 0.2105, reg_loss: 0.2102 ||:  73%|#######2  | 69/95 [00:47<00:18,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8811, UAS: 0.9433, LAS: 0.8948, UEM: 0.5953, LEM: 0.3574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6593, partial_loss/deprel_loss: 0.6696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8781, loss: 0.7900, batch_reg_loss: 0.2105, reg_loss: 0.2102 ||:  77%|#######6  | 73/95 [00:50<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8730, UAS: 0.9430, LAS: 0.8946, UEM: 0.5979, LEM: 0.3656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8570, partial_loss/deprel_loss: 0.6944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9374, loss: 0.7903, batch_reg_loss: 0.2105, reg_loss: 0.2102 ||:  81%|########1 | 77/95 [00:52<00:12,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9436, LAS: 0.8948, UEM: 0.5961, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3584, partial_loss/deprel_loss: 0.5289, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7054, loss: 0.7883, batch_reg_loss: 0.2106, reg_loss: 0.2102 ||:  86%|########6 | 82/95 [00:55<00:08,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8454, UAS: 0.9435, LAS: 0.8946, UEM: 0.5942, LEM: 0.3578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0259, partial_loss/deprel_loss: 0.8515, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0970, loss: 0.7897, batch_reg_loss: 0.2106, reg_loss: 0.2102 ||:  91%|######### | 86/95 [00:57<00:05,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9424, LAS: 0.8932, UEM: 0.5910, LEM: 0.3536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2694, partial_loss/deprel_loss: 0.5058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6692, loss: 0.8006, batch_reg_loss: 0.2107, reg_loss: 0.2103 ||:  95%|#########4| 90/95 [00:59<00:02,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8833, UAS: 0.9428, LAS: 0.8936, UEM: 0.5896, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6038, partial_loss/deprel_loss: 0.7466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9288, loss: 0.7983, batch_reg_loss: 0.2107, reg_loss: 0.2103 ||:  99%|#########8| 94/95 [01:01<00:00,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9430, LAS: 0.8937, UEM: 0.5892, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4186, partial_loss/deprel_loss: 0.6067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7798, loss: 0.7981, batch_reg_loss: 0.2107, reg_loss: 0.2103 ||: 100%|##########| 95/95 [01:02<00:00,  1.52it/s]\n",
+      "2023-04-07 00:42:09,402 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9232, LAS: 0.8683, UEM: 0.2793, LEM: 0.0670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8644, partial_loss/deprel_loss: 23.3140, partial_loss/cycle_loss: 0.0000, batch_loss: 18.8241, loss: 25.2268, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.06s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9332, LAS: 0.8790, UEM: 0.4771, LEM: 0.2306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0162, partial_loss/deprel_loss: 30.2918, partial_loss/cycle_loss: 0.0000, batch_loss: 24.4367, loss: 19.9516, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:06,  1.02s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9460, LAS: 0.8955, UEM: 0.6681, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2215, partial_loss/deprel_loss: 6.6622, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3741, loss: 16.2766, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:07<00:02,  1.02it/s]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9493, LAS: 0.8990, UEM: 0.6866, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1776, partial_loss/deprel_loss: 10.1514, partial_loss/cycle_loss: 0.0000, batch_loss: 8.1566, loss: 15.0778, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:09<00:01,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9473, LAS: 0.8964, UEM: 0.6672, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1476, partial_loss/deprel_loss: 34.2343, partial_loss/cycle_loss: 0.0000, batch_loss: 27.6170, loss: 16.2177, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.02it/s]\n",
+      "2023-04-07 00:42:20,193 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:42:20,200 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:42:20,200 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.210  |     0.000\n",
+      "2023-04-07 00:42:20,200 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:42:20,200 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - UEM                      |     0.589  |     0.667\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - LEM                      |     0.349  |     0.406\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - EM                       |     0.903  |     0.871\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.419  |     1.148\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - UAS                      |     0.943  |     0.947\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.607  |    34.234\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - loss                     |     0.798  |    16.218\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - LAS                      |     0.894  |     0.896\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:42:20,201 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:42:23,127 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 00:42:24,821 - INFO - combo.training.trainer - Epoch duration: 0:01:18.082225\n",
+      "2023-04-07 00:42:24,822 - INFO - combo.training.trainer - Estimated training time remaining: 5:33:57\n",
+      "2023-04-07 00:42:24,822 - INFO - allennlp.training.trainer - Epoch 101/399\n",
+      "2023-04-07 00:42:24,822 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:42:24,822 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:42:24,830 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9455, LAS: 0.8939, UEM: 0.5151, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6720, partial_loss/deprel_loss: 0.6995, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9047, loss: 0.7793, batch_reg_loss: 0.2108, reg_loss: 0.2108 ||:   3%|3         | 3/95 [00:02<01:12,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9327, LAS: 0.8829, UEM: 0.4016, LEM: 0.1922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7709, partial_loss/deprel_loss: 0.6747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9048, loss: 0.8643, batch_reg_loss: 0.2108, reg_loss: 0.2108 ||:   7%|7         | 7/95 [00:04<01:03,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9364, LAS: 0.8876, UEM: 0.4195, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6654, partial_loss/deprel_loss: 0.5985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8227, loss: 0.8277, batch_reg_loss: 0.2109, reg_loss: 0.2108 ||:  12%|#1        | 11/95 [00:06<00:56,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9379, LAS: 0.8884, UEM: 0.4110, LEM: 0.1858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4987, partial_loss/deprel_loss: 0.5354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7389, loss: 0.8165, batch_reg_loss: 0.2109, reg_loss: 0.2108 ||:  15%|#4        | 14/95 [00:09<00:55,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9357, LAS: 0.8852, UEM: 0.4233, LEM: 0.1953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5996, partial_loss/deprel_loss: 0.6657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8634, loss: 0.8442, batch_reg_loss: 0.2109, reg_loss: 0.2108 ||:  19%|#8        | 18/95 [00:11<00:51,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9327, LAS: 0.8823, UEM: 0.3946, LEM: 0.1790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8833, partial_loss/deprel_loss: 0.7777, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0098, loss: 0.8695, batch_reg_loss: 0.2110, reg_loss: 0.2109 ||:  22%|##2       | 21/95 [00:13<00:49,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9345, LAS: 0.8844, UEM: 0.4073, LEM: 0.1858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8482, partial_loss/deprel_loss: 0.7386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9715, loss: 0.8596, batch_reg_loss: 0.2110, reg_loss: 0.2109 ||:  25%|##5       | 24/95 [00:16<00:50,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9341, LAS: 0.8841, UEM: 0.4211, LEM: 0.1965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2279, partial_loss/deprel_loss: 0.3688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5517, loss: 0.8643, batch_reg_loss: 0.2110, reg_loss: 0.2109 ||:  28%|##8       | 27/95 [00:18<00:50,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9359, LAS: 0.8858, UEM: 0.4352, LEM: 0.2046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2679, partial_loss/deprel_loss: 0.4803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6489, loss: 0.8506, batch_reg_loss: 0.2111, reg_loss: 0.2109 ||:  32%|###1      | 30/95 [00:20<00:46,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9387, LAS: 0.8888, UEM: 0.4930, LEM: 0.2517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2998, partial_loss/deprel_loss: 0.4433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6257, loss: 0.8265, batch_reg_loss: 0.2111, reg_loss: 0.2109 ||:  35%|###4      | 33/95 [00:22<00:44,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9402, LAS: 0.8904, UEM: 0.5115, LEM: 0.2644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3645, partial_loss/deprel_loss: 0.4926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6782, loss: 0.8160, batch_reg_loss: 0.2112, reg_loss: 0.2109 ||:  38%|###7      | 36/95 [00:24<00:43,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8625, UAS: 0.9406, LAS: 0.8904, UEM: 0.5123, LEM: 0.2619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9386, partial_loss/deprel_loss: 0.8632, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0895, loss: 0.8178, batch_reg_loss: 0.2112, reg_loss: 0.2110 ||:  41%|####1     | 39/95 [00:27<00:41,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9419, LAS: 0.8919, UEM: 0.5254, LEM: 0.2739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3000, partial_loss/deprel_loss: 0.4581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6377, loss: 0.8079, batch_reg_loss: 0.2112, reg_loss: 0.2110 ||:  44%|####4     | 42/95 [00:29<00:40,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.9404, LAS: 0.8904, UEM: 0.5121, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0808, partial_loss/deprel_loss: 0.8916, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1407, loss: 0.8215, batch_reg_loss: 0.2113, reg_loss: 0.2110 ||:  47%|####7     | 45/95 [00:31<00:37,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9407, LAS: 0.8910, UEM: 0.5141, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7744, partial_loss/deprel_loss: 0.7258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9468, loss: 0.8184, batch_reg_loss: 0.2113, reg_loss: 0.2110 ||:  51%|#####     | 48/95 [00:33<00:35,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8842, UAS: 0.9412, LAS: 0.8917, UEM: 0.5137, LEM: 0.2666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7934, partial_loss/deprel_loss: 0.6631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9005, loss: 0.8133, batch_reg_loss: 0.2113, reg_loss: 0.2110 ||:  54%|#####3    | 51/95 [00:36<00:32,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9420, LAS: 0.8925, UEM: 0.5334, LEM: 0.2870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1297, partial_loss/deprel_loss: 0.3139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.8087, batch_reg_loss: 0.2114, reg_loss: 0.2111 ||:  57%|#####6    | 54/95 [00:38<00:29,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9412, LAS: 0.8917, UEM: 0.5325, LEM: 0.2885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3427, partial_loss/deprel_loss: 0.9391, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2313, loss: 0.8169, batch_reg_loss: 0.2114, reg_loss: 0.2111 ||:  60%|######    | 57/95 [00:40<00:27,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9424, LAS: 0.8928, UEM: 0.5456, LEM: 0.2975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1766, partial_loss/deprel_loss: 0.3578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5330, loss: 0.8107, batch_reg_loss: 0.2114, reg_loss: 0.2111 ||:  64%|######4   | 61/95 [00:43<00:24,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8594, UAS: 0.9427, LAS: 0.8930, UEM: 0.5506, LEM: 0.3031, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8510, partial_loss/deprel_loss: 0.8349, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0496, loss: 0.8082, batch_reg_loss: 0.2115, reg_loss: 0.2111 ||:  67%|######7   | 64/95 [00:45<00:23,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9224, UAS: 0.9438, LAS: 0.8942, UEM: 0.5588, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2555, partial_loss/deprel_loss: 0.4168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5961, loss: 0.7995, batch_reg_loss: 0.2115, reg_loss: 0.2111 ||:  72%|#######1  | 68/95 [00:48<00:19,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9438, LAS: 0.8941, UEM: 0.5529, LEM: 0.3017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3956, partial_loss/deprel_loss: 0.5128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7009, loss: 0.8012, batch_reg_loss: 0.2115, reg_loss: 0.2112 ||:  76%|#######5  | 72/95 [00:50<00:15,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9436, LAS: 0.8938, UEM: 0.5466, LEM: 0.2960, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4656, partial_loss/deprel_loss: 0.5490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7439, loss: 0.8015, batch_reg_loss: 0.2116, reg_loss: 0.2112 ||:  80%|########  | 76/95 [00:52<00:12,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9447, LAS: 0.8953, UEM: 0.5698, LEM: 0.3204, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2514, partial_loss/deprel_loss: 0.3880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5723, loss: 0.7901, batch_reg_loss: 0.2116, reg_loss: 0.2112 ||:  84%|########4 | 80/95 [00:55<00:09,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8843, UAS: 0.9440, LAS: 0.8948, UEM: 0.5618, LEM: 0.3149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7325, partial_loss/deprel_loss: 0.6691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8934, loss: 0.7958, batch_reg_loss: 0.2116, reg_loss: 0.2112 ||:  89%|########9 | 85/95 [00:57<00:06,  1.65it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9434, LAS: 0.8941, UEM: 0.5681, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1874, partial_loss/deprel_loss: 0.3598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5370, loss: 0.8008, batch_reg_loss: 0.2117, reg_loss: 0.2112 ||:  94%|#########3| 89/95 [01:00<00:03,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8478, UAS: 0.9432, LAS: 0.8939, UEM: 0.5741, LEM: 0.3298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0500, partial_loss/deprel_loss: 0.8519, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1033, loss: 0.8011, batch_reg_loss: 0.2117, reg_loss: 0.2113 ||:  98%|#########7| 93/95 [01:02<00:01,  1.77it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.9430, LAS: 0.8939, UEM: 0.5884, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4152, partial_loss/deprel_loss: 0.9883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2854, loss: 0.8015, batch_reg_loss: 0.2117, reg_loss: 0.2113 ||: 100%|##########| 95/95 [01:03<00:00,  1.50it/s]\n",
+      "2023-04-07 00:43:30,616 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:43:30,616 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.211  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - UEM                      |     0.588  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - LEM                      |     0.352  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - EM                       |     0.829  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.415  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - UAS                      |     0.943  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.988  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - loss                     |     0.801  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - LAS                      |     0.894  |       N/A\n",
+      "2023-04-07 00:43:30,617 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:43:30,618 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:43:30,618 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:43:30,618 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:43:30,618 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:43:30,618 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:43:30,622 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 00:43:35,495 - INFO - combo.training.trainer - Epoch duration: 0:01:10.672863\n",
+      "2023-04-07 00:43:35,495 - INFO - combo.training.trainer - Estimated training time remaining: 5:33:01\n",
+      "2023-04-07 00:43:35,495 - INFO - allennlp.training.trainer - Epoch 102/399\n",
+      "2023-04-07 00:43:35,495 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:43:35,496 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:43:35,504 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9521, LAS: 0.9062, UEM: 0.7124, LEM: 0.4650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1537, partial_loss/deprel_loss: 0.3345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5101, loss: 0.6921, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||:   3%|3         | 3/95 [00:02<01:07,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9536, LAS: 0.9073, UEM: 0.6696, LEM: 0.4063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5607, partial_loss/deprel_loss: 0.6313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8290, loss: 0.6918, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||:   6%|6         | 6/95 [00:04<01:05,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9520, LAS: 0.9068, UEM: 0.6532, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1500, partial_loss/deprel_loss: 0.2989, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4809, loss: 0.6883, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||:   9%|9         | 9/95 [00:06<01:02,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9549, LAS: 0.9105, UEM: 0.6647, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1886, partial_loss/deprel_loss: 0.3493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5289, loss: 0.6660, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||:  13%|#2        | 12/95 [00:08<01:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9064, UAS: 0.9532, LAS: 0.9078, UEM: 0.6495, LEM: 0.3949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3812, partial_loss/deprel_loss: 0.4743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6674, loss: 0.6793, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||:  16%|#5        | 15/95 [00:10<00:58,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9506, LAS: 0.9038, UEM: 0.6323, LEM: 0.3787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2353, partial_loss/deprel_loss: 0.4131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5893, loss: 0.7058, batch_reg_loss: 0.2118, reg_loss: 0.2118 ||:  20%|##        | 19/95 [00:13<00:54,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9511, LAS: 0.9037, UEM: 0.6248, LEM: 0.3679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3517, partial_loss/deprel_loss: 0.5103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6903, loss: 0.7073, batch_reg_loss: 0.2117, reg_loss: 0.2118 ||:  24%|##4       | 23/95 [00:16<00:50,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9505, LAS: 0.9030, UEM: 0.6142, LEM: 0.3564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3182, partial_loss/deprel_loss: 0.4879, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6657, loss: 0.7166, batch_reg_loss: 0.2117, reg_loss: 0.2118 ||:  27%|##7       | 26/95 [00:18<00:50,  1.37it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9508, LAS: 0.9032, UEM: 0.6042, LEM: 0.3456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3389, partial_loss/deprel_loss: 0.4671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6532, loss: 0.7163, batch_reg_loss: 0.2117, reg_loss: 0.2118 ||:  31%|###       | 29/95 [00:20<00:46,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9487, LAS: 0.9009, UEM: 0.5931, LEM: 0.3384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4692, partial_loss/deprel_loss: 0.5537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7485, loss: 0.7315, batch_reg_loss: 0.2117, reg_loss: 0.2117 ||:  34%|###3      | 32/95 [00:23<00:45,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9486, LAS: 0.9007, UEM: 0.5894, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2707, partial_loss/deprel_loss: 0.3305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5302, loss: 0.7299, batch_reg_loss: 0.2117, reg_loss: 0.2117 ||:  38%|###7      | 36/95 [00:25<00:42,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8570, UAS: 0.9455, LAS: 0.8975, UEM: 0.5728, LEM: 0.3236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2140, partial_loss/deprel_loss: 0.8312, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1194, loss: 0.7540, batch_reg_loss: 0.2117, reg_loss: 0.2117 ||:  42%|####2     | 40/95 [00:28<00:38,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9460, LAS: 0.8981, UEM: 0.5713, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0632, partial_loss/deprel_loss: 0.8227, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0824, loss: 0.7558, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||:  46%|####6     | 44/95 [00:31<00:34,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9459, LAS: 0.8983, UEM: 0.5647, LEM: 0.3146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6393, partial_loss/deprel_loss: 0.5721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7971, loss: 0.7581, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||:  51%|#####     | 48/95 [00:33<00:31,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9431, LAS: 0.8953, UEM: 0.5522, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8668, partial_loss/deprel_loss: 0.8258, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0456, loss: 0.7828, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||:  55%|#####4    | 52/95 [00:36<00:28,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8759, UAS: 0.9428, LAS: 0.8952, UEM: 0.5478, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8932, partial_loss/deprel_loss: 0.7050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9542, loss: 0.7836, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||:  59%|#####8    | 56/95 [00:38<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9425, LAS: 0.8947, UEM: 0.5395, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7946, partial_loss/deprel_loss: 0.6991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9298, loss: 0.7874, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||:  63%|######3   | 60/95 [00:41<00:24,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9430, LAS: 0.8951, UEM: 0.5460, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1893, partial_loss/deprel_loss: 0.3831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5559, loss: 0.7838, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||:  66%|######6   | 63/95 [00:44<00:23,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9072, UAS: 0.9428, LAS: 0.8948, UEM: 0.5391, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4142, partial_loss/deprel_loss: 0.4686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6693, loss: 0.7874, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||:  71%|#######   | 67/95 [00:46<00:19,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9441, LAS: 0.8964, UEM: 0.5725, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2495, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5878, loss: 0.7745, batch_reg_loss: 0.2116, reg_loss: 0.2117 ||:  74%|#######3  | 70/95 [00:49<00:18,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9441, LAS: 0.8966, UEM: 0.5679, LEM: 0.3309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6874, partial_loss/deprel_loss: 0.5693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8045, loss: 0.7731, batch_reg_loss: 0.2115, reg_loss: 0.2117 ||:  78%|#######7  | 74/95 [00:52<00:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9446, LAS: 0.8970, UEM: 0.5734, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2100, partial_loss/deprel_loss: 0.3634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5443, loss: 0.7715, batch_reg_loss: 0.2115, reg_loss: 0.2117 ||:  82%|########2 | 78/95 [00:54<00:11,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9452, LAS: 0.8977, UEM: 0.5832, LEM: 0.3450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1146, partial_loss/deprel_loss: 0.2876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4645, loss: 0.7671, batch_reg_loss: 0.2115, reg_loss: 0.2117 ||:  86%|########6 | 82/95 [00:57<00:09,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9608, UAS: 0.9459, LAS: 0.8986, UEM: 0.5984, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0602, partial_loss/deprel_loss: 0.1530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3459, loss: 0.7613, batch_reg_loss: 0.2115, reg_loss: 0.2117 ||:  89%|########9 | 85/95 [01:01<00:09,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9454, LAS: 0.8981, UEM: 0.5941, LEM: 0.3636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8619, partial_loss/deprel_loss: 0.7147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9556, loss: 0.7658, batch_reg_loss: 0.2115, reg_loss: 0.2116 ||:  93%|#########2| 88/95 [01:04<00:06,  1.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9458, LAS: 0.8986, UEM: 0.5942, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2808, partial_loss/deprel_loss: 0.3974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5855, loss: 0.7629, batch_reg_loss: 0.2114, reg_loss: 0.2116 ||:  96%|#########5| 91/95 [01:06<00:03,  1.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9449, LAS: 0.8977, UEM: 0.5913, LEM: 0.3593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2987, partial_loss/deprel_loss: 0.4296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6148, loss: 0.7685, batch_reg_loss: 0.2114, reg_loss: 0.2116 ||: 100%|##########| 95/95 [01:08<00:00,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9449, LAS: 0.8977, UEM: 0.5913, LEM: 0.3593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2987, partial_loss/deprel_loss: 0.4296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6148, loss: 0.7685, batch_reg_loss: 0.2114, reg_loss: 0.2116 ||: 100%|##########| 95/95 [01:08<00:00,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.212  |       N/A\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - UEM                      |     0.591  |       N/A\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - LEM                      |     0.359  |       N/A\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - EM                       |     0.914  |       N/A\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.299  |       N/A\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - UAS                      |     0.945  |       N/A\n",
+      "2023-04-07 00:44:47,224 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.430  |       N/A\n",
+      "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - loss                     |     0.769  |       N/A\n",
+      "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - LAS                      |     0.898  |       N/A\n",
+      "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:44:47,225 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:44:47,229 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 00:44:53,279 - INFO - combo.training.trainer - Epoch duration: 0:01:17.783558\n",
+      "2023-04-07 00:44:53,279 - INFO - combo.training.trainer - Estimated training time remaining: 5:32:25\n",
+      "2023-04-07 00:44:53,279 - INFO - allennlp.training.trainer - Epoch 103/399\n",
+      "2023-04-07 00:44:53,279 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:44:53,280 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:44:53,288 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9603, LAS: 0.9123, UEM: 0.6606, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3014, partial_loss/deprel_loss: 0.4709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6484, loss: 0.6638, batch_reg_loss: 0.2114, reg_loss: 0.2114 ||:   4%|4         | 4/95 [00:02<00:58,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9543, LAS: 0.9080, UEM: 0.5909, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5996, partial_loss/deprel_loss: 0.6053, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8156, loss: 0.6955, batch_reg_loss: 0.2114, reg_loss: 0.2114 ||:   7%|7         | 7/95 [00:04<00:59,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9574, LAS: 0.9098, UEM: 0.6177, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3169, partial_loss/deprel_loss: 0.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6583, loss: 0.6811, batch_reg_loss: 0.2114, reg_loss: 0.2114 ||:  11%|#         | 10/95 [00:07<00:59,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9529, LAS: 0.9052, UEM: 0.6078, LEM: 0.3407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0751, partial_loss/deprel_loss: 0.8086, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0733, loss: 0.7161, batch_reg_loss: 0.2114, reg_loss: 0.2114 ||:  14%|#3        | 13/95 [00:09<00:58,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9530, LAS: 0.9058, UEM: 0.6004, LEM: 0.3327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3120, partial_loss/deprel_loss: 0.4136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6046, loss: 0.7144, batch_reg_loss: 0.2113, reg_loss: 0.2114 ||:  17%|#6        | 16/95 [00:11<00:57,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9515, LAS: 0.9047, UEM: 0.5861, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7027, partial_loss/deprel_loss: 0.6695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8874, loss: 0.7294, batch_reg_loss: 0.2113, reg_loss: 0.2114 ||:  21%|##1       | 20/95 [00:14<00:52,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9515, LAS: 0.9044, UEM: 0.5928, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3325, partial_loss/deprel_loss: 0.4349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6257, loss: 0.7300, batch_reg_loss: 0.2113, reg_loss: 0.2114 ||:  24%|##4       | 23/95 [00:16<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9509, LAS: 0.9040, UEM: 0.5738, LEM: 0.3118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4470, partial_loss/deprel_loss: 0.4292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6441, loss: 0.7313, batch_reg_loss: 0.2113, reg_loss: 0.2114 ||:  28%|##8       | 27/95 [00:18<00:45,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9473, LAS: 0.9004, UEM: 0.5564, LEM: 0.2981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1648, partial_loss/deprel_loss: 0.7256, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0247, loss: 0.7556, batch_reg_loss: 0.2113, reg_loss: 0.2113 ||:  33%|###2      | 31/95 [00:20<00:41,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9468, LAS: 0.8999, UEM: 0.5468, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7834, partial_loss/deprel_loss: 0.6629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8982, loss: 0.7612, batch_reg_loss: 0.2113, reg_loss: 0.2113 ||:  36%|###5      | 34/95 [00:23<00:41,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9481, LAS: 0.9013, UEM: 0.5603, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2875, partial_loss/deprel_loss: 0.4270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6104, loss: 0.7508, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||:  40%|####      | 38/95 [00:25<00:37,  1.52it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9485, LAS: 0.9018, UEM: 0.5788, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8666, partial_loss/deprel_loss: 0.7088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9516, loss: 0.7468, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||:  43%|####3     | 41/95 [00:27<00:36,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9472, LAS: 0.9004, UEM: 0.5676, LEM: 0.3140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2658, partial_loss/deprel_loss: 0.4552, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6285, loss: 0.7578, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||:  47%|####7     | 45/95 [00:30<00:32,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8621, UAS: 0.9471, LAS: 0.9004, UEM: 0.5813, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1070, partial_loss/deprel_loss: 0.7919, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0661, loss: 0.7578, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||:  52%|#####1    | 49/95 [00:33<00:31,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9476, LAS: 0.9013, UEM: 0.5869, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2432, partial_loss/deprel_loss: 0.3426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5339, loss: 0.7513, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||:  56%|#####5    | 53/95 [00:35<00:28,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9472, LAS: 0.9009, UEM: 0.5792, LEM: 0.3357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3781, partial_loss/deprel_loss: 0.5024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6887, loss: 0.7536, batch_reg_loss: 0.2112, reg_loss: 0.2113 ||:  60%|######    | 57/95 [00:38<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9458, LAS: 0.8993, UEM: 0.5723, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4452, partial_loss/deprel_loss: 0.5259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7209, loss: 0.7673, batch_reg_loss: 0.2111, reg_loss: 0.2113 ||:  64%|######4   | 61/95 [00:41<00:23,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9708, UAS: 0.9462, LAS: 0.9001, UEM: 0.5942, LEM: 0.3635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0553, partial_loss/deprel_loss: 0.1266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3235, loss: 0.7626, batch_reg_loss: 0.2111, reg_loss: 0.2113 ||:  67%|######7   | 64/95 [00:43<00:22,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9468, LAS: 0.9008, UEM: 0.5974, LEM: 0.3659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2163, partial_loss/deprel_loss: 0.3673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5482, loss: 0.7570, batch_reg_loss: 0.2111, reg_loss: 0.2113 ||:  71%|#######   | 67/95 [00:46<00:20,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9470, LAS: 0.9007, UEM: 0.5963, LEM: 0.3643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1547, partial_loss/deprel_loss: 0.3192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4974, loss: 0.7582, batch_reg_loss: 0.2111, reg_loss: 0.2113 ||:  75%|#######4  | 71/95 [00:48<00:17,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9467, LAS: 0.9004, UEM: 0.5969, LEM: 0.3659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9089, partial_loss/deprel_loss: 0.7662, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0058, loss: 0.7609, batch_reg_loss: 0.2111, reg_loss: 0.2112 ||:  78%|#######7  | 74/95 [00:50<00:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9472, LAS: 0.9008, UEM: 0.6026, LEM: 0.3699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1965, partial_loss/deprel_loss: 0.3498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5303, loss: 0.7568, batch_reg_loss: 0.2111, reg_loss: 0.2112 ||:  81%|########1 | 77/95 [00:52<00:12,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9479, LAS: 0.9014, UEM: 0.6057, LEM: 0.3696, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2890, partial_loss/deprel_loss: 0.5286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6917, loss: 0.7527, batch_reg_loss: 0.2111, reg_loss: 0.2112 ||:  85%|########5 | 81/95 [00:55<00:09,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9479, LAS: 0.9015, UEM: 0.6086, LEM: 0.3742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6256, partial_loss/deprel_loss: 0.5794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7997, loss: 0.7518, batch_reg_loss: 0.2110, reg_loss: 0.2112 ||:  88%|########8 | 84/95 [00:57<00:07,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9481, LAS: 0.9018, UEM: 0.6058, LEM: 0.3705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3206, partial_loss/deprel_loss: 0.4056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5996, loss: 0.7494, batch_reg_loss: 0.2110, reg_loss: 0.2112 ||:  92%|#########1| 87/95 [00:59<00:05,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9486, LAS: 0.9023, UEM: 0.6125, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4127, partial_loss/deprel_loss: 0.4841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6809, loss: 0.7445, batch_reg_loss: 0.2110, reg_loss: 0.2112 ||:  95%|#########4| 90/95 [01:01<00:03,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8883, UAS: 0.9485, LAS: 0.9022, UEM: 0.6137, LEM: 0.3766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6325, partial_loss/deprel_loss: 0.5781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8000, loss: 0.7444, batch_reg_loss: 0.2110, reg_loss: 0.2112 ||:  98%|#########7| 93/95 [01:04<00:01,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9485, LAS: 0.9021, UEM: 0.6115, LEM: 0.3741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3744, partial_loss/deprel_loss: 0.4893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6773, loss: 0.7451, batch_reg_loss: 0.2110, reg_loss: 0.2112 ||: 100%|##########| 95/95 [01:05<00:00,  1.45it/s]\n",
+      "2023-04-07 00:46:02,149 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.211  |       N/A\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - UEM                      |     0.612  |       N/A\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - LEM                      |     0.374  |       N/A\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - EM                       |     0.909  |       N/A\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.374  |       N/A\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - UAS                      |     0.948  |       N/A\n",
+      "2023-04-07 00:46:02,150 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.489  |       N/A\n",
+      "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - loss                     |     0.745  |       N/A\n",
+      "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - LAS                      |     0.902  |       N/A\n",
+      "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:46:02,151 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:46:02,156 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:46:07,469 - INFO - combo.training.trainer - Epoch duration: 0:01:14.189764\n",
+      "2023-04-07 00:46:07,469 - INFO - combo.training.trainer - Estimated training time remaining: 5:31:38\n",
+      "2023-04-07 00:46:07,470 - INFO - allennlp.training.trainer - Epoch 104/399\n",
+      "2023-04-07 00:46:07,470 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:46:07,470 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:46:07,477 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8761, UAS: 0.9486, LAS: 0.9035, UEM: 0.5426, LEM: 0.2815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9259, partial_loss/deprel_loss: 0.6544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9197, loss: 0.7281, batch_reg_loss: 0.2110, reg_loss: 0.2110 ||:   5%|5         | 5/95 [00:02<00:42,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.9336, LAS: 0.8878, UEM: 0.4455, LEM: 0.2218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1320, partial_loss/deprel_loss: 0.7576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0434, loss: 0.8465, batch_reg_loss: 0.2109, reg_loss: 0.2110 ||:   9%|9         | 9/95 [00:04<00:45,  1.91it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9352, LAS: 0.8884, UEM: 0.4043, LEM: 0.1875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7125, partial_loss/deprel_loss: 0.6259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8541, loss: 0.8350, batch_reg_loss: 0.2109, reg_loss: 0.2109 ||:  14%|#3        | 13/95 [00:07<00:43,  1.87it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9405, LAS: 0.8939, UEM: 0.5158, LEM: 0.2835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1708, partial_loss/deprel_loss: 0.3469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5226, loss: 0.7897, batch_reg_loss: 0.2109, reg_loss: 0.2109 ||:  17%|#6        | 16/95 [00:09<00:50,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9449, LAS: 0.8988, UEM: 0.5457, LEM: 0.2957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2295, partial_loss/deprel_loss: 0.3936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5717, loss: 0.7572, batch_reg_loss: 0.2109, reg_loss: 0.2109 ||:  21%|##1       | 20/95 [00:12<00:46,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9488, LAS: 0.9029, UEM: 0.5981, LEM: 0.3401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3027, partial_loss/deprel_loss: 0.4291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.7248, batch_reg_loss: 0.2109, reg_loss: 0.2109 ||:  25%|##5       | 24/95 [00:14<00:43,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9475, LAS: 0.9023, UEM: 0.6085, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7056, partial_loss/deprel_loss: 0.6024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8339, loss: 0.7343, batch_reg_loss: 0.2108, reg_loss: 0.2109 ||:  31%|###       | 29/95 [00:16<00:38,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9636, UAS: 0.9477, LAS: 0.9031, UEM: 0.6416, LEM: 0.4193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0509, partial_loss/deprel_loss: 0.1444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3365, loss: 0.7310, batch_reg_loss: 0.2108, reg_loss: 0.2109 ||:  36%|###5      | 34/95 [00:20<00:35,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9469, LAS: 0.9021, UEM: 0.6232, LEM: 0.4020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6437, partial_loss/deprel_loss: 0.5984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8182, loss: 0.7407, batch_reg_loss: 0.2108, reg_loss: 0.2109 ||:  40%|####      | 38/95 [00:22<00:34,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9484, LAS: 0.9038, UEM: 0.6286, LEM: 0.4029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2140, partial_loss/deprel_loss: 0.3781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.7318, batch_reg_loss: 0.2108, reg_loss: 0.2109 ||:  44%|####4     | 42/95 [00:25<00:34,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8276, UAS: 0.9474, LAS: 0.9025, UEM: 0.6257, LEM: 0.3976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5362, partial_loss/deprel_loss: 0.9158, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2506, loss: 0.7397, batch_reg_loss: 0.2108, reg_loss: 0.2109 ||:  48%|####8     | 46/95 [00:28<00:32,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9482, LAS: 0.9034, UEM: 0.6346, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5049, partial_loss/deprel_loss: 0.5597, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7595, loss: 0.7305, batch_reg_loss: 0.2107, reg_loss: 0.2109 ||:  52%|#####1    | 49/95 [00:30<00:32,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9499, LAS: 0.9054, UEM: 0.6560, LEM: 0.4268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1969, partial_loss/deprel_loss: 0.3742, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5495, loss: 0.7160, batch_reg_loss: 0.2107, reg_loss: 0.2109 ||:  55%|#####4    | 52/95 [00:33<00:31,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9496, LAS: 0.9051, UEM: 0.6522, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2033, partial_loss/deprel_loss: 0.3288, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.7190, batch_reg_loss: 0.2107, reg_loss: 0.2108 ||:  58%|#####7    | 55/95 [00:35<00:28,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8153, UAS: 0.9488, LAS: 0.9044, UEM: 0.6488, LEM: 0.4191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7446, partial_loss/deprel_loss: 1.0545, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4032, loss: 0.7245, batch_reg_loss: 0.2107, reg_loss: 0.2108 ||:  62%|######2   | 59/95 [00:38<00:25,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9483, LAS: 0.9038, UEM: 0.6402, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6970, partial_loss/deprel_loss: 0.6823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8959, loss: 0.7292, batch_reg_loss: 0.2107, reg_loss: 0.2108 ||:  65%|######5   | 62/95 [00:40<00:22,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9486, LAS: 0.9038, UEM: 0.6324, LEM: 0.4012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4369, partial_loss/deprel_loss: 0.5940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7732, loss: 0.7300, batch_reg_loss: 0.2107, reg_loss: 0.2108 ||:  69%|######9   | 66/95 [00:42<00:19,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9483, LAS: 0.9037, UEM: 0.6228, LEM: 0.3921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7550, partial_loss/deprel_loss: 0.6404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8740, loss: 0.7323, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||:  74%|#######3  | 70/95 [00:45<00:16,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9474, LAS: 0.9025, UEM: 0.6128, LEM: 0.3836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4196, partial_loss/deprel_loss: 0.4898, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6863, loss: 0.7416, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||:  78%|#######7  | 74/95 [00:47<00:14,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9474, LAS: 0.9026, UEM: 0.6179, LEM: 0.3899, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3672, partial_loss/deprel_loss: 0.4953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6803, loss: 0.7409, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||:  81%|########1 | 77/95 [00:50<00:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9479, LAS: 0.9032, UEM: 0.6182, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4544, partial_loss/deprel_loss: 0.4467, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6589, loss: 0.7365, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||:  84%|########4 | 80/95 [00:52<00:11,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9003, UAS: 0.9478, LAS: 0.9030, UEM: 0.6133, LEM: 0.3834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5621, partial_loss/deprel_loss: 0.5379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7533, loss: 0.7377, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||:  87%|########7 | 83/95 [00:54<00:08,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9480, LAS: 0.9029, UEM: 0.6098, LEM: 0.3783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7110, partial_loss/deprel_loss: 0.6598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8806, loss: 0.7389, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||:  92%|#########1| 87/95 [00:57<00:05,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9485, LAS: 0.9037, UEM: 0.6098, LEM: 0.3768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4768, partial_loss/deprel_loss: 0.5769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7674, loss: 0.7351, batch_reg_loss: 0.2106, reg_loss: 0.2108 ||:  96%|#########5| 91/95 [00:59<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9490, LAS: 0.9040, UEM: 0.6130, LEM: 0.3783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3877, partial_loss/deprel_loss: 0.4527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6502, loss: 0.7312, batch_reg_loss: 0.2105, reg_loss: 0.2108 ||: 100%|##########| 95/95 [01:02<00:00,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9490, LAS: 0.9040, UEM: 0.6130, LEM: 0.3783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3877, partial_loss/deprel_loss: 0.4527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6502, loss: 0.7312, batch_reg_loss: 0.2105, reg_loss: 0.2108 ||: 100%|##########| 95/95 [01:02<00:00,  1.52it/s]\n",
+      "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.211  |       N/A\n",
+      "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - UEM                      |     0.613  |       N/A\n",
+      "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - LEM                      |     0.378  |       N/A\n",
+      "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - EM                       |     0.909  |       N/A\n",
+      "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.388  |       N/A\n",
+      "2023-04-07 00:47:13,057 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - UAS                      |     0.949  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.453  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - loss                     |     0.731  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - LAS                      |     0.904  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:47:13,058 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:47:13,063 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 00:47:18,026 - INFO - combo.training.trainer - Epoch duration: 0:01:10.556335\n",
+      "2023-04-07 00:47:18,026 - INFO - combo.training.trainer - Estimated training time remaining: 5:30:40\n",
+      "2023-04-07 00:47:18,027 - INFO - allennlp.training.trainer - Epoch 105/399\n",
+      "2023-04-07 00:47:18,027 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:47:18,027 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:47:18,036 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9570, LAS: 0.9120, UEM: 0.5975, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2832, partial_loss/deprel_loss: 0.4190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6024, loss: 0.6560, batch_reg_loss: 0.2105, reg_loss: 0.2105 ||:   4%|4         | 4/95 [00:02<00:59,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9531, LAS: 0.9077, UEM: 0.5550, LEM: 0.2548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3870, partial_loss/deprel_loss: 0.5263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7089, loss: 0.6960, batch_reg_loss: 0.2105, reg_loss: 0.2105 ||:   8%|8         | 8/95 [00:05<00:55,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9463, LAS: 0.9007, UEM: 0.4835, LEM: 0.2113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8110, partial_loss/deprel_loss: 0.6490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8919, loss: 0.7512, batch_reg_loss: 0.2105, reg_loss: 0.2105 ||:  13%|#2        | 12/95 [00:07<00:53,  1.54it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9457, LAS: 0.8996, UEM: 0.4813, LEM: 0.2167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5843, partial_loss/deprel_loss: 0.6242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8267, loss: 0.7601, batch_reg_loss: 0.2105, reg_loss: 0.2105 ||:  16%|#5        | 15/95 [00:09<00:53,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9465, LAS: 0.9008, UEM: 0.4827, LEM: 0.2172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7159, partial_loss/deprel_loss: 0.5946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8293, loss: 0.7534, batch_reg_loss: 0.2104, reg_loss: 0.2105 ||:  19%|#8        | 18/95 [00:11<00:51,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9498, LAS: 0.9052, UEM: 0.5952, LEM: 0.3621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1832, partial_loss/deprel_loss: 0.3887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5580, loss: 0.7230, batch_reg_loss: 0.2104, reg_loss: 0.2105 ||:  22%|##2       | 21/95 [00:14<00:52,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9324, UAS: 0.9503, LAS: 0.9058, UEM: 0.5896, LEM: 0.3530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1957, partial_loss/deprel_loss: 0.3786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5524, loss: 0.7190, batch_reg_loss: 0.2104, reg_loss: 0.2105 ||:  25%|##5       | 24/95 [00:16<00:49,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9507, LAS: 0.9063, UEM: 0.5772, LEM: 0.3384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4686, partial_loss/deprel_loss: 0.4857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.7133, batch_reg_loss: 0.2104, reg_loss: 0.2105 ||:  29%|##9       | 28/95 [00:18<00:44,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9513, LAS: 0.9068, UEM: 0.5866, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3569, partial_loss/deprel_loss: 0.4758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6624, loss: 0.7079, batch_reg_loss: 0.2104, reg_loss: 0.2105 ||:  33%|###2      | 31/95 [00:20<00:44,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9532, LAS: 0.9094, UEM: 0.6135, LEM: 0.3745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2121, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.6891, batch_reg_loss: 0.2104, reg_loss: 0.2104 ||:  37%|###6      | 35/95 [00:23<00:40,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8089, UAS: 0.9516, LAS: 0.9077, UEM: 0.6169, LEM: 0.3743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7495, partial_loss/deprel_loss: 1.0144, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3718, loss: 0.6998, batch_reg_loss: 0.2103, reg_loss: 0.2104 ||:  41%|####1     | 39/95 [00:25<00:35,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9532, LAS: 0.9088, UEM: 0.6282, LEM: 0.3755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2260, partial_loss/deprel_loss: 0.3663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5485, loss: 0.6905, batch_reg_loss: 0.2103, reg_loss: 0.2104 ||:  46%|####6     | 44/95 [00:27<00:29,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9531, LAS: 0.9086, UEM: 0.6165, LEM: 0.3636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5207, partial_loss/deprel_loss: 0.5418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7478, loss: 0.6937, batch_reg_loss: 0.2103, reg_loss: 0.2104 ||:  52%|#####1    | 49/95 [00:29<00:24,  1.89it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9533, LAS: 0.9089, UEM: 0.6172, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3151, partial_loss/deprel_loss: 0.4696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6490, loss: 0.6927, batch_reg_loss: 0.2102, reg_loss: 0.2104 ||:  57%|#####6    | 54/95 [00:32<00:22,  1.85it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9532, LAS: 0.9088, UEM: 0.6171, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7426, partial_loss/deprel_loss: 0.7018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9202, loss: 0.6939, batch_reg_loss: 0.2102, reg_loss: 0.2104 ||:  61%|######1   | 58/95 [00:35<00:21,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8225, UAS: 0.9519, LAS: 0.9073, UEM: 0.6183, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6574, partial_loss/deprel_loss: 0.9583, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3083, loss: 0.7046, batch_reg_loss: 0.2102, reg_loss: 0.2104 ||:  65%|######5   | 62/95 [00:38<00:20,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9515, LAS: 0.9069, UEM: 0.6156, LEM: 0.3664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2118, partial_loss/deprel_loss: 0.3798, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5564, loss: 0.7087, batch_reg_loss: 0.2102, reg_loss: 0.2104 ||:  69%|######9   | 66/95 [00:40<00:17,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9520, LAS: 0.9076, UEM: 0.6303, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1286, partial_loss/deprel_loss: 0.2056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4004, loss: 0.7020, batch_reg_loss: 0.2102, reg_loss: 0.2104 ||:  74%|#######3  | 70/95 [00:43<00:16,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9517, LAS: 0.9071, UEM: 0.6325, LEM: 0.3852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2563, partial_loss/deprel_loss: 0.4714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6385, loss: 0.7048, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||:  78%|#######7  | 74/95 [00:47<00:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9508, LAS: 0.9060, UEM: 0.6239, LEM: 0.3776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4800, partial_loss/deprel_loss: 0.5786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7690, loss: 0.7125, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||:  82%|########2 | 78/95 [00:49<00:11,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9497, LAS: 0.9048, UEM: 0.6149, LEM: 0.3708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3706, partial_loss/deprel_loss: 0.5104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6926, loss: 0.7231, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||:  86%|########6 | 82/95 [00:52<00:08,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9496, LAS: 0.9047, UEM: 0.6108, LEM: 0.3679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8035, partial_loss/deprel_loss: 0.6049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8548, loss: 0.7240, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||:  91%|######### | 86/95 [00:54<00:06,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9504, LAS: 0.9054, UEM: 0.6188, LEM: 0.3744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3558, partial_loss/deprel_loss: 0.5337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7082, loss: 0.7201, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||:  95%|#########4| 90/95 [00:58<00:03,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9502, LAS: 0.9051, UEM: 0.6203, LEM: 0.3784, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0376, partial_loss/deprel_loss: 0.7604, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0259, loss: 0.7230, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||:  98%|#########7| 93/95 [01:00<00:01,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9504, LAS: 0.9055, UEM: 0.6219, LEM: 0.3790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4298, partial_loss/deprel_loss: 0.4989, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6951, loss: 0.7205, batch_reg_loss: 0.2101, reg_loss: 0.2103 ||: 100%|##########| 95/95 [01:01<00:00,  1.54it/s]\n",
+      "2023-04-07 00:48:22,720 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.9526, LAS: 0.9053, UEM: 0.7958, LEM: 0.6181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0069, partial_loss/deprel_loss: 28.5755, partial_loss/cycle_loss: 0.0000, batch_loss: 23.0618, loss: 14.0415, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9514, LAS: 0.9038, UEM: 0.6964, LEM: 0.4699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6319, partial_loss/deprel_loss: 14.2944, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5619, loss: 13.0727, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:05,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9563, LAS: 0.9079, UEM: 0.7305, LEM: 0.4721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4565, partial_loss/deprel_loss: 15.2645, partial_loss/cycle_loss: 0.0000, batch_loss: 12.3029, loss: 12.1444, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:06<00:03,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9524, LAS: 0.9031, UEM: 0.7130, LEM: 0.4540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3994, partial_loss/deprel_loss: 10.5160, partial_loss/cycle_loss: 0.0000, batch_loss: 8.4927, loss: 13.7313, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  82%|########1 | 9/11 [00:08<00:01,  1.01it/s] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9500, LAS: 0.8992, UEM: 0.6770, LEM: 0.4156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8960, partial_loss/deprel_loss: 21.6052, partial_loss/cycle_loss: 0.0000, batch_loss: 17.4634, loss: 15.1769, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.03it/s]\n",
+      "2023-04-07 00:48:33,390 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:48:33,390 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.210  |     0.000\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - UEM                      |     0.622  |     0.677\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - LEM                      |     0.379  |     0.416\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - EM                       |     0.912  |     0.890\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.430  |     0.896\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |     0.950\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.499  |    21.605\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - loss                     |     0.720  |    15.177\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - LAS                      |     0.905  |     0.899\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:48:33,391 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:48:33,392 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:48:33,392 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:48:33,392 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:48:33,396 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 00:48:38,203 - INFO - combo.training.trainer - Epoch duration: 0:01:20.176690\n",
+      "2023-04-07 00:48:38,204 - INFO - combo.training.trainer - Estimated training time remaining: 5:30:08\n",
+      "2023-04-07 00:48:38,204 - INFO - allennlp.training.trainer - Epoch 106/399\n",
+      "2023-04-07 00:48:38,204 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:48:38,205 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:48:38,215 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9498, LAS: 0.9024, UEM: 0.4920, LEM: 0.2301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5409, partial_loss/deprel_loss: 0.5081, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7247, loss: 0.7104, batch_reg_loss: 0.2101, reg_loss: 0.2101 ||:   3%|3         | 3/95 [00:02<01:12,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8803, UAS: 0.9462, LAS: 0.9003, UEM: 0.5475, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7342, partial_loss/deprel_loss: 0.6105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8453, loss: 0.7253, batch_reg_loss: 0.2100, reg_loss: 0.2101 ||:   6%|6         | 6/95 [00:04<01:09,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9498, LAS: 0.9057, UEM: 0.6378, LEM: 0.4287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1322, partial_loss/deprel_loss: 0.2281, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4189, loss: 0.6960, batch_reg_loss: 0.2100, reg_loss: 0.2100 ||:   9%|9         | 9/95 [00:06<01:05,  1.31it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9505, LAS: 0.9063, UEM: 0.6819, LEM: 0.4650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1668, partial_loss/deprel_loss: 0.3607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5320, loss: 0.6906, batch_reg_loss: 0.2100, reg_loss: 0.2100 ||:  13%|#2        | 12/95 [00:09<01:03,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9497, LAS: 0.9052, UEM: 0.6633, LEM: 0.4399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2834, partial_loss/deprel_loss: 0.4268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6081, loss: 0.7021, batch_reg_loss: 0.2100, reg_loss: 0.2100 ||:  16%|#5        | 15/95 [00:11<00:58,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9518, LAS: 0.9075, UEM: 0.6630, LEM: 0.4276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2743, partial_loss/deprel_loss: 0.3698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5607, loss: 0.6882, batch_reg_loss: 0.2100, reg_loss: 0.2100 ||:  19%|#8        | 18/95 [00:13<00:58,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9543, LAS: 0.9107, UEM: 0.6664, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2467, partial_loss/deprel_loss: 0.3821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5650, loss: 0.6702, batch_reg_loss: 0.2100, reg_loss: 0.2100 ||:  23%|##3       | 22/95 [00:15<00:50,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9533, LAS: 0.9099, UEM: 0.6436, LEM: 0.4015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3590, partial_loss/deprel_loss: 0.4570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6474, loss: 0.6792, batch_reg_loss: 0.2099, reg_loss: 0.2100 ||:  27%|##7       | 26/95 [00:18<00:46,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9548, LAS: 0.9112, UEM: 0.6559, LEM: 0.4081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2568, partial_loss/deprel_loss: 0.4226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5993, loss: 0.6713, batch_reg_loss: 0.2099, reg_loss: 0.2100 ||:  31%|###       | 29/95 [00:20<00:44,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9549, LAS: 0.9112, UEM: 0.6425, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4614, partial_loss/deprel_loss: 0.4829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6885, loss: 0.6705, batch_reg_loss: 0.2099, reg_loss: 0.2100 ||:  34%|###3      | 32/95 [00:22<00:42,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9560, LAS: 0.9123, UEM: 0.6523, LEM: 0.4023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3046, partial_loss/deprel_loss: 0.4142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6021, loss: 0.6607, batch_reg_loss: 0.2099, reg_loss: 0.2100 ||:  38%|###7      | 36/95 [00:24<00:38,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9521, LAS: 0.9079, UEM: 0.6326, LEM: 0.3877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5551, partial_loss/deprel_loss: 0.5666, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7742, loss: 0.6933, batch_reg_loss: 0.2099, reg_loss: 0.2100 ||:  42%|####2     | 40/95 [00:26<00:33,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9514, LAS: 0.9071, UEM: 0.6180, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2428, partial_loss/deprel_loss: 0.4172, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5922, loss: 0.6998, batch_reg_loss: 0.2098, reg_loss: 0.2100 ||:  47%|####7     | 45/95 [00:29<00:28,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9517, LAS: 0.9073, UEM: 0.6297, LEM: 0.3848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1789, partial_loss/deprel_loss: 0.3202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5018, loss: 0.6986, batch_reg_loss: 0.2098, reg_loss: 0.2099 ||:  52%|#####1    | 49/95 [00:31<00:25,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9510, LAS: 0.9064, UEM: 0.6171, LEM: 0.3746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7447, partial_loss/deprel_loss: 0.7049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9226, loss: 0.7078, batch_reg_loss: 0.2098, reg_loss: 0.2099 ||:  56%|#####5    | 53/95 [00:33<00:23,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9518, LAS: 0.9075, UEM: 0.6210, LEM: 0.3760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6031, partial_loss/deprel_loss: 0.5276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7524, loss: 0.7021, batch_reg_loss: 0.2098, reg_loss: 0.2099 ||:  60%|######    | 57/95 [00:36<00:23,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9244, UAS: 0.9513, LAS: 0.9070, UEM: 0.6121, LEM: 0.3668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3028, partial_loss/deprel_loss: 0.4520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6319, loss: 0.7062, batch_reg_loss: 0.2098, reg_loss: 0.2099 ||:  64%|######4   | 61/95 [00:38<00:20,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9509, LAS: 0.9065, UEM: 0.6052, LEM: 0.3606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6779, partial_loss/deprel_loss: 0.6311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8502, loss: 0.7111, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||:  68%|######8   | 65/95 [00:41<00:18,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9506, LAS: 0.9060, UEM: 0.6054, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3979, partial_loss/deprel_loss: 0.4622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6591, loss: 0.7159, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||:  73%|#######2  | 69/95 [00:44<00:16,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9499, LAS: 0.9054, UEM: 0.6007, LEM: 0.3559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6178, partial_loss/deprel_loss: 0.6083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8199, loss: 0.7208, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||:  77%|#######6  | 73/95 [00:46<00:13,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9501, LAS: 0.9055, UEM: 0.5959, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3291, partial_loss/deprel_loss: 0.4398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6274, loss: 0.7204, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||:  81%|########1 | 77/95 [00:49<00:11,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9508, LAS: 0.9062, UEM: 0.6101, LEM: 0.3644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0923, partial_loss/deprel_loss: 0.2688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4432, loss: 0.7151, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||:  85%|########5 | 81/95 [00:52<00:09,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9513, LAS: 0.9068, UEM: 0.6119, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2397, partial_loss/deprel_loss: 0.4208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5942, loss: 0.7124, batch_reg_loss: 0.2097, reg_loss: 0.2099 ||:  88%|########8 | 84/95 [00:55<00:07,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9515, LAS: 0.9071, UEM: 0.6116, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9780, partial_loss/deprel_loss: 0.7000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9652, loss: 0.7113, batch_reg_loss: 0.2096, reg_loss: 0.2098 ||:  93%|#########2| 88/95 [00:57<00:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9511, LAS: 0.9067, UEM: 0.6071, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4269, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6845, loss: 0.7147, batch_reg_loss: 0.2096, reg_loss: 0.2098 ||:  97%|#########6| 92/95 [01:00<00:02,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9516, LAS: 0.9075, UEM: 0.6207, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4486, partial_loss/deprel_loss: 0.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6339, loss: 0.7087, batch_reg_loss: 0.2096, reg_loss: 0.2098 ||: 100%|##########| 95/95 [01:02<00:00,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9516, LAS: 0.9075, UEM: 0.6207, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4486, partial_loss/deprel_loss: 0.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6339, loss: 0.7087, batch_reg_loss: 0.2096, reg_loss: 0.2098 ||: 100%|##########| 95/95 [01:02<00:00,  1.51it/s]\n",
+      "2023-04-07 00:49:43,998 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.210  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - UEM                      |     0.621  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - LEM                      |     0.381  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - EM                       |     0.917  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.449  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - UAS                      |     0.952  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.418  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - loss                     |     0.709  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - LAS                      |     0.908  |       N/A\n",
+      "2023-04-07 00:49:43,999 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:49:44,000 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:49:44,000 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:49:44,000 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:49:44,000 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:49:44,000 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:49:44,005 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 00:49:48,752 - INFO - combo.training.trainer - Epoch duration: 0:01:10.547947\n",
+      "2023-04-07 00:49:48,752 - INFO - combo.training.trainer - Estimated training time remaining: 5:29:10\n",
+      "2023-04-07 00:49:48,752 - INFO - allennlp.training.trainer - Epoch 107/399\n",
+      "2023-04-07 00:49:48,753 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:49:48,753 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:49:48,763 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9279, LAS: 0.8832, UEM: 0.2030, LEM: 0.0752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7221, partial_loss/deprel_loss: 0.6773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8958, loss: 0.9065, batch_reg_loss: 0.2096, reg_loss: 0.2096 ||:   3%|3         | 3/95 [00:02<01:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9411, LAS: 0.8992, UEM: 0.6315, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5848, loss: 0.7685, batch_reg_loss: 0.2096, reg_loss: 0.2096 ||:   6%|6         | 6/95 [00:04<01:01,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9444, LAS: 0.9015, UEM: 0.6124, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3404, partial_loss/deprel_loss: 0.4668, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6510, loss: 0.7529, batch_reg_loss: 0.2095, reg_loss: 0.2096 ||:  11%|#         | 10/95 [00:06<00:56,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9440, LAS: 0.9006, UEM: 0.6267, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2018, partial_loss/deprel_loss: 0.3549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5338, loss: 0.7550, batch_reg_loss: 0.2095, reg_loss: 0.2096 ||:  14%|#3        | 13/95 [00:09<01:00,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9447, LAS: 0.9009, UEM: 0.6051, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3996, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6789, loss: 0.7548, batch_reg_loss: 0.2095, reg_loss: 0.2095 ||:  18%|#7        | 17/95 [00:12<00:55,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9475, LAS: 0.9039, UEM: 0.6153, LEM: 0.3838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3382, partial_loss/deprel_loss: 0.4225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6152, loss: 0.7260, batch_reg_loss: 0.2095, reg_loss: 0.2095 ||:  21%|##1       | 20/95 [00:14<00:53,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9497, LAS: 0.9067, UEM: 0.6197, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3754, partial_loss/deprel_loss: 0.4243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6240, loss: 0.7098, batch_reg_loss: 0.2095, reg_loss: 0.2095 ||:  24%|##4       | 23/95 [00:16<00:51,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9518, LAS: 0.9089, UEM: 0.6527, LEM: 0.4164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1493, partial_loss/deprel_loss: 0.2967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4767, loss: 0.6938, batch_reg_loss: 0.2095, reg_loss: 0.2095 ||:  27%|##7       | 26/95 [00:18<00:51,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9525, LAS: 0.9096, UEM: 0.6346, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4358, partial_loss/deprel_loss: 0.4881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6871, loss: 0.6928, batch_reg_loss: 0.2095, reg_loss: 0.2095 ||:  32%|###1      | 30/95 [00:21<00:45,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9512, LAS: 0.9084, UEM: 0.6289, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7776, partial_loss/deprel_loss: 0.6976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9230, loss: 0.7011, batch_reg_loss: 0.2094, reg_loss: 0.2095 ||:  35%|###4      | 33/95 [00:23<00:45,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8602, UAS: 0.9497, LAS: 0.9069, UEM: 0.6102, LEM: 0.3786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1460, partial_loss/deprel_loss: 0.7777, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0608, loss: 0.7117, batch_reg_loss: 0.2094, reg_loss: 0.2095 ||:  39%|###8      | 37/95 [00:26<00:40,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9505, LAS: 0.9075, UEM: 0.6062, LEM: 0.3720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2654, partial_loss/deprel_loss: 0.4050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5865, loss: 0.7071, batch_reg_loss: 0.2094, reg_loss: 0.2095 ||:  42%|####2     | 40/95 [00:28<00:38,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9510, LAS: 0.9079, UEM: 0.6074, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3733, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6283, loss: 0.7037, batch_reg_loss: 0.2094, reg_loss: 0.2095 ||:  46%|####6     | 44/95 [00:30<00:33,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9505, LAS: 0.9074, UEM: 0.6036, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7993, partial_loss/deprel_loss: 0.6920, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9228, loss: 0.7085, batch_reg_loss: 0.2094, reg_loss: 0.2095 ||:  51%|#####     | 48/95 [00:32<00:29,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9510, LAS: 0.9079, UEM: 0.6014, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4517, partial_loss/deprel_loss: 0.5461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7366, loss: 0.7052, batch_reg_loss: 0.2093, reg_loss: 0.2095 ||:  55%|#####4    | 52/95 [00:34<00:25,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9512, LAS: 0.9079, UEM: 0.5973, LEM: 0.3566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4527, partial_loss/deprel_loss: 0.5273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7217, loss: 0.7043, batch_reg_loss: 0.2093, reg_loss: 0.2095 ||:  60%|######    | 57/95 [00:37<00:21,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9517, LAS: 0.9084, UEM: 0.6008, LEM: 0.3591, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2877, partial_loss/deprel_loss: 0.4465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6240, loss: 0.7005, batch_reg_loss: 0.2093, reg_loss: 0.2094 ||:  65%|######5   | 62/95 [00:39<00:17,  1.90it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9507, LAS: 0.9072, UEM: 0.5863, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5253, partial_loss/deprel_loss: 0.5571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7600, loss: 0.7086, batch_reg_loss: 0.2093, reg_loss: 0.2094 ||:  71%|#######   | 67/95 [00:41<00:13,  2.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9510, LAS: 0.9074, UEM: 0.5902, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3831, partial_loss/deprel_loss: 0.4447, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6416, loss: 0.7070, batch_reg_loss: 0.2092, reg_loss: 0.2094 ||:  76%|#######5  | 72/95 [00:45<00:13,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9507, LAS: 0.9074, UEM: 0.6074, LEM: 0.3759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3002, partial_loss/deprel_loss: 0.4206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6057, loss: 0.7075, batch_reg_loss: 0.2092, reg_loss: 0.2094 ||:  80%|########  | 76/95 [00:48<00:12,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9512, LAS: 0.9079, UEM: 0.6104, LEM: 0.3769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3422, partial_loss/deprel_loss: 0.4635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6485, loss: 0.7034, batch_reg_loss: 0.2092, reg_loss: 0.2094 ||:  84%|########4 | 80/95 [00:51<00:09,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9517, LAS: 0.9086, UEM: 0.6212, LEM: 0.3883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1150, partial_loss/deprel_loss: 0.2780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4546, loss: 0.6978, batch_reg_loss: 0.2092, reg_loss: 0.2094 ||:  88%|########8 | 84/95 [00:53<00:06,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8233, UAS: 0.9509, LAS: 0.9077, UEM: 0.6160, LEM: 0.3835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6555, partial_loss/deprel_loss: 0.9330, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2867, loss: 0.7047, batch_reg_loss: 0.2092, reg_loss: 0.2094 ||:  93%|#########2| 88/95 [00:56<00:04,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9509, LAS: 0.9076, UEM: 0.6166, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5582, partial_loss/deprel_loss: 0.5507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7613, loss: 0.7061, batch_reg_loss: 0.2091, reg_loss: 0.2094 ||:  97%|#########6| 92/95 [00:59<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9514, LAS: 0.9081, UEM: 0.6205, LEM: 0.3876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4833, partial_loss/deprel_loss: 0.5759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7664, loss: 0.7025, batch_reg_loss: 0.2091, reg_loss: 0.2094 ||: 100%|##########| 95/95 [01:01<00:00,  1.55it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:50:52,802 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.209  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - UEM                      |     0.621  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - LEM                      |     0.388  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - EM                       |     0.904  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.483  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - UAS                      |     0.951  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:50:52,803 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.576  |       N/A\n",
+      "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - loss                     |     0.702  |       N/A\n",
+      "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - LAS                      |     0.908  |       N/A\n",
+      "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:50:52,804 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:50:52,809 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 00:50:58,225 - INFO - combo.training.trainer - Epoch duration: 0:01:09.472212\n",
+      "2023-04-07 00:50:58,225 - INFO - combo.training.trainer - Estimated training time remaining: 5:28:08\n",
+      "2023-04-07 00:50:58,226 - INFO - allennlp.training.trainer - Epoch 108/399\n",
+      "2023-04-07 00:50:58,226 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:50:58,227 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:50:58,237 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9554, LAS: 0.9106, UEM: 0.5932, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1861, partial_loss/deprel_loss: 0.3261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5072, loss: 0.7211, batch_reg_loss: 0.2091, reg_loss: 0.2091 ||:   3%|3         | 3/95 [00:02<01:11,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8598, UAS: 0.9537, LAS: 0.9107, UEM: 0.7085, LEM: 0.4866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1022, partial_loss/deprel_loss: 0.7836, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0564, loss: 0.7066, batch_reg_loss: 0.2091, reg_loss: 0.2091 ||:   7%|7         | 7/95 [00:04<01:04,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9580, LAS: 0.9153, UEM: 0.7221, LEM: 0.4892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3536, partial_loss/deprel_loss: 0.4257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6203, loss: 0.6625, batch_reg_loss: 0.2091, reg_loss: 0.2091 ||:  11%|#         | 10/95 [00:07<01:02,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9570, LAS: 0.9129, UEM: 0.6728, LEM: 0.4317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3364, partial_loss/deprel_loss: 0.4736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6552, loss: 0.6820, batch_reg_loss: 0.2090, reg_loss: 0.2091 ||:  15%|#4        | 14/95 [00:09<00:56,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9569, LAS: 0.9138, UEM: 0.6635, LEM: 0.4250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4624, partial_loss/deprel_loss: 0.4495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6611, loss: 0.6735, batch_reg_loss: 0.2090, reg_loss: 0.2091 ||:  19%|#8        | 18/95 [00:12<00:53,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9581, LAS: 0.9150, UEM: 0.6645, LEM: 0.4206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2707, partial_loss/deprel_loss: 0.4033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5858, loss: 0.6635, batch_reg_loss: 0.2090, reg_loss: 0.2091 ||:  22%|##2       | 21/95 [00:14<00:53,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9588, LAS: 0.9162, UEM: 0.6591, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2285, partial_loss/deprel_loss: 0.4090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5819, loss: 0.6562, batch_reg_loss: 0.2090, reg_loss: 0.2090 ||:  26%|##6       | 25/95 [00:17<00:49,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9580, LAS: 0.9155, UEM: 0.6468, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7635, partial_loss/deprel_loss: 0.6478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8799, loss: 0.6586, batch_reg_loss: 0.2090, reg_loss: 0.2090 ||:  31%|###       | 29/95 [00:19<00:45,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9563, LAS: 0.9135, UEM: 0.6265, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7999, partial_loss/deprel_loss: 0.6219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8664, loss: 0.6706, batch_reg_loss: 0.2089, reg_loss: 0.2090 ||:  34%|###3      | 32/95 [00:21<00:43,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9566, LAS: 0.9138, UEM: 0.6330, LEM: 0.3886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5881, partial_loss/deprel_loss: 0.4875, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7165, loss: 0.6644, batch_reg_loss: 0.2089, reg_loss: 0.2090 ||:  37%|###6      | 35/95 [00:24<00:42,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9557, LAS: 0.9128, UEM: 0.6217, LEM: 0.3803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8190, partial_loss/deprel_loss: 0.6872, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9225, loss: 0.6715, batch_reg_loss: 0.2089, reg_loss: 0.2090 ||:  41%|####1     | 39/95 [00:26<00:38,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9537, LAS: 0.9106, UEM: 0.6048, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5283, partial_loss/deprel_loss: 0.5358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7432, loss: 0.6887, batch_reg_loss: 0.2089, reg_loss: 0.2090 ||:  45%|####5     | 43/95 [00:29<00:33,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9538, LAS: 0.9108, UEM: 0.6031, LEM: 0.3657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5701, partial_loss/deprel_loss: 0.4870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7125, loss: 0.6881, batch_reg_loss: 0.2089, reg_loss: 0.2090 ||:  49%|####9     | 47/95 [00:31<00:31,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9543, LAS: 0.9113, UEM: 0.6065, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4044, partial_loss/deprel_loss: 0.4574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6556, loss: 0.6834, batch_reg_loss: 0.2088, reg_loss: 0.2090 ||:  54%|#####3    | 51/95 [00:34<00:29,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9541, LAS: 0.9109, UEM: 0.6083, LEM: 0.3668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1321, partial_loss/deprel_loss: 0.7378, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0255, loss: 0.6860, batch_reg_loss: 0.2088, reg_loss: 0.2090 ||:  58%|#####7    | 55/95 [00:37<00:27,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9532, LAS: 0.9099, UEM: 0.6028, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2816, partial_loss/deprel_loss: 0.4076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5912, loss: 0.6913, batch_reg_loss: 0.2088, reg_loss: 0.2089 ||:  62%|######2   | 59/95 [00:39<00:24,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9522, LAS: 0.9089, UEM: 0.5919, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5001, partial_loss/deprel_loss: 0.5308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7334, loss: 0.6973, batch_reg_loss: 0.2088, reg_loss: 0.2089 ||:  66%|######6   | 63/95 [00:42<00:21,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9524, LAS: 0.9093, UEM: 0.6102, LEM: 0.3798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5797, partial_loss/deprel_loss: 0.6738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8638, loss: 0.6955, batch_reg_loss: 0.2088, reg_loss: 0.2089 ||:  71%|#######   | 67/95 [00:45<00:19,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9510, LAS: 0.9080, UEM: 0.6014, LEM: 0.3723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4449, partial_loss/deprel_loss: 0.4204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6341, loss: 0.7026, batch_reg_loss: 0.2088, reg_loss: 0.2089 ||:  75%|#######4  | 71/95 [00:47<00:15,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9517, LAS: 0.9088, UEM: 0.6074, LEM: 0.3770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3527, partial_loss/deprel_loss: 0.3824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5852, loss: 0.6971, batch_reg_loss: 0.2087, reg_loss: 0.2089 ||:  80%|########  | 76/95 [00:50<00:11,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9527, LAS: 0.9099, UEM: 0.6241, LEM: 0.3919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2745, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5869, loss: 0.6882, batch_reg_loss: 0.2087, reg_loss: 0.2089 ||:  84%|########4 | 80/95 [00:52<00:08,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9521, LAS: 0.9091, UEM: 0.6147, LEM: 0.3834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6618, partial_loss/deprel_loss: 0.6279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8434, loss: 0.6943, batch_reg_loss: 0.2087, reg_loss: 0.2089 ||:  89%|########9 | 85/95 [00:54<00:05,  1.86it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9519, LAS: 0.9088, UEM: 0.6121, LEM: 0.3817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6193, partial_loss/deprel_loss: 0.6511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8534, loss: 0.6958, batch_reg_loss: 0.2087, reg_loss: 0.2089 ||:  94%|#########3| 89/95 [00:56<00:03,  1.85it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9526, LAS: 0.9094, UEM: 0.6191, LEM: 0.3860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3453, partial_loss/deprel_loss: 0.4614, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6468, loss: 0.6909, batch_reg_loss: 0.2087, reg_loss: 0.2089 ||:  98%|#########7| 93/95 [00:59<00:01,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9523, LAS: 0.9091, UEM: 0.6216, LEM: 0.3892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1122, partial_loss/deprel_loss: 0.2778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4534, loss: 0.6928, batch_reg_loss: 0.2086, reg_loss: 0.2089 ||: 100%|##########| 95/95 [01:01<00:00,  1.55it/s]\n",
+      "2023-04-07 00:52:02,857 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:52:02,857 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:52:02,857 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.209  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - UEM                      |     0.622  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - LEM                      |     0.389  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - EM                       |     0.940  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.112  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - UAS                      |     0.952  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.278  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - loss                     |     0.693  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - LAS                      |     0.909  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:52:02,858 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:52:02,859 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:52:02,859 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:52:02,859 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:52:02,863 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:52:07,709 - INFO - combo.training.trainer - Epoch duration: 0:01:09.483094\n",
+      "2023-04-07 00:52:07,709 - INFO - combo.training.trainer - Estimated training time remaining: 5:27:06\n",
+      "2023-04-07 00:52:07,709 - INFO - allennlp.training.trainer - Epoch 109/399\n",
+      "2023-04-07 00:52:07,709 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:52:07,710 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:52:07,717 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9737, LAS: 0.9335, UEM: 0.8213, LEM: 0.5670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1799, partial_loss/deprel_loss: 0.3374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.4883, batch_reg_loss: 0.2086, reg_loss: 0.2086 ||:   3%|3         | 3/95 [00:02<01:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9638, LAS: 0.9217, UEM: 0.7067, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3636, partial_loss/deprel_loss: 0.4693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6568, loss: 0.6022, batch_reg_loss: 0.2086, reg_loss: 0.2086 ||:   7%|7         | 7/95 [00:04<01:00,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9561, LAS: 0.9129, UEM: 0.6724, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.5999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7991, loss: 0.6619, batch_reg_loss: 0.2086, reg_loss: 0.2086 ||:  11%|#         | 10/95 [00:06<00:59,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9543, LAS: 0.9103, UEM: 0.6235, LEM: 0.3683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3306, partial_loss/deprel_loss: 0.5062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6797, loss: 0.6850, batch_reg_loss: 0.2086, reg_loss: 0.2086 ||:  15%|#4        | 14/95 [00:09<00:54,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9574, LAS: 0.9142, UEM: 0.6780, LEM: 0.4364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1156, partial_loss/deprel_loss: 0.2067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3970, loss: 0.6520, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||:  18%|#7        | 17/95 [00:11<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9594, LAS: 0.9161, UEM: 0.6983, LEM: 0.4522, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2219, partial_loss/deprel_loss: 0.4078, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5791, loss: 0.6379, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||:  21%|##1       | 20/95 [00:13<00:54,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9587, LAS: 0.9145, UEM: 0.6847, LEM: 0.4386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5254, partial_loss/deprel_loss: 0.5624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7635, loss: 0.6516, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||:  24%|##4       | 23/95 [00:16<00:52,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9586, LAS: 0.9149, UEM: 0.6768, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3560, partial_loss/deprel_loss: 0.4095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6073, loss: 0.6530, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||:  27%|##7       | 26/95 [00:18<00:51,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9536, LAS: 0.9092, UEM: 0.6545, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9298, partial_loss/deprel_loss: 0.6837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9414, loss: 0.6911, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||:  31%|###       | 29/95 [00:20<00:47,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9550, LAS: 0.9107, UEM: 0.6705, LEM: 0.4313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4781, partial_loss/deprel_loss: 0.5187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7190, loss: 0.6806, batch_reg_loss: 0.2085, reg_loss: 0.2086 ||:  34%|###3      | 32/95 [00:22<00:46,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9550, LAS: 0.9108, UEM: 0.6640, LEM: 0.4253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2077, partial_loss/deprel_loss: 0.3057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4946, loss: 0.6793, batch_reg_loss: 0.2085, reg_loss: 0.2085 ||:  37%|###6      | 35/95 [00:25<00:44,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9554, LAS: 0.9116, UEM: 0.6613, LEM: 0.4234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1922, partial_loss/deprel_loss: 0.2809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4716, loss: 0.6733, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||:  40%|####      | 38/95 [00:27<00:42,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9545, LAS: 0.9108, UEM: 0.6472, LEM: 0.4103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4890, partial_loss/deprel_loss: 0.5500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7462, loss: 0.6796, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||:  43%|####3     | 41/95 [00:29<00:40,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9557, LAS: 0.9123, UEM: 0.6722, LEM: 0.4444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3647, partial_loss/deprel_loss: 0.4614, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6505, loss: 0.6698, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||:  46%|####6     | 44/95 [00:32<00:39,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9557, LAS: 0.9123, UEM: 0.6712, LEM: 0.4408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3744, partial_loss/deprel_loss: 0.5112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6922, loss: 0.6716, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||:  51%|#####     | 48/95 [00:34<00:34,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8761, UAS: 0.9554, LAS: 0.9121, UEM: 0.6678, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8979, partial_loss/deprel_loss: 0.7309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9726, loss: 0.6757, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||:  54%|#####3    | 51/95 [00:36<00:32,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9561, LAS: 0.9128, UEM: 0.6685, LEM: 0.4339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2373, partial_loss/deprel_loss: 0.3559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5406, loss: 0.6699, batch_reg_loss: 0.2084, reg_loss: 0.2085 ||:  57%|#####6    | 54/95 [00:39<00:31,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9567, LAS: 0.9137, UEM: 0.6687, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2389, partial_loss/deprel_loss: 0.3803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.6649, batch_reg_loss: 0.2083, reg_loss: 0.2085 ||:  61%|######1   | 58/95 [00:42<00:27,  1.34it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9560, LAS: 0.9128, UEM: 0.6614, LEM: 0.4244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5460, partial_loss/deprel_loss: 0.6238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8166, loss: 0.6726, batch_reg_loss: 0.2083, reg_loss: 0.2085 ||:  64%|######4   | 61/95 [00:44<00:24,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9563, LAS: 0.9133, UEM: 0.6652, LEM: 0.4291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1201, partial_loss/deprel_loss: 0.2667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4457, loss: 0.6687, batch_reg_loss: 0.2083, reg_loss: 0.2085 ||:  67%|######7   | 64/95 [00:46<00:23,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9556, LAS: 0.9127, UEM: 0.6565, LEM: 0.4214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7757, partial_loss/deprel_loss: 0.6345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8710, loss: 0.6739, batch_reg_loss: 0.2083, reg_loss: 0.2085 ||:  72%|#######1  | 68/95 [00:49<00:19,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9551, LAS: 0.9123, UEM: 0.6508, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5849, partial_loss/deprel_loss: 0.4252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6654, loss: 0.6765, batch_reg_loss: 0.2083, reg_loss: 0.2084 ||:  76%|#######5  | 72/95 [00:51<00:16,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9544, LAS: 0.9115, UEM: 0.6458, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4878, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6566, loss: 0.6817, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||:  80%|########  | 76/95 [00:54<00:12,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9547, LAS: 0.9119, UEM: 0.6430, LEM: 0.4057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5226, partial_loss/deprel_loss: 0.5032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7153, loss: 0.6791, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||:  84%|########4 | 80/95 [00:56<00:09,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9538, LAS: 0.9108, UEM: 0.6404, LEM: 0.4044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1304, partial_loss/deprel_loss: 0.3280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4967, loss: 0.6843, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||:  88%|########8 | 84/95 [00:59<00:07,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9537, LAS: 0.9106, UEM: 0.6383, LEM: 0.4030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5488, partial_loss/deprel_loss: 0.5528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7602, loss: 0.6862, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||:  93%|#########2| 88/95 [01:01<00:04,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9532, LAS: 0.9100, UEM: 0.6286, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7232, partial_loss/deprel_loss: 0.5868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8223, loss: 0.6904, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||:  98%|#########7| 93/95 [01:03<00:01,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9532, LAS: 0.9100, UEM: 0.6285, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1779, partial_loss/deprel_loss: 0.3895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5553, loss: 0.6906, batch_reg_loss: 0.2082, reg_loss: 0.2084 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n",
+      "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.208  |       N/A\n",
+      "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - UEM                      |     0.629  |       N/A\n",
+      "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - LEM                      |     0.393  |       N/A\n",
+      "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - EM                       |     0.933  |       N/A\n",
+      "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.178  |       N/A\n",
+      "2023-04-07 00:53:15,569 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - UAS                      |     0.953  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.389  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - loss                     |     0.691  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - LAS                      |     0.910  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:53:15,570 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:53:15,575 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 00:53:20,146 - INFO - combo.training.trainer - Epoch duration: 0:01:12.436840\n",
+      "2023-04-07 00:53:20,147 - INFO - combo.training.trainer - Estimated training time remaining: 5:26:12\n",
+      "2023-04-07 00:53:20,147 - INFO - allennlp.training.trainer - Epoch 110/399\n",
+      "2023-04-07 00:53:20,147 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:53:20,148 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:53:20,156 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9701, LAS: 0.9316, UEM: 0.8100, LEM: 0.6100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1711, partial_loss/deprel_loss: 0.3258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5030, loss: 0.5320, batch_reg_loss: 0.2082, reg_loss: 0.2082 ||:   4%|4         | 4/95 [00:02<00:47,  1.92it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9519, LAS: 0.9116, UEM: 0.6588, LEM: 0.4655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4492, partial_loss/deprel_loss: 0.4790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6811, loss: 0.6690, batch_reg_loss: 0.2081, reg_loss: 0.2081 ||:   9%|9         | 9/95 [00:04<00:42,  2.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8418, UAS: 0.9484, LAS: 0.9073, UEM: 0.6214, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3577, partial_loss/deprel_loss: 0.7750, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0997, loss: 0.6918, batch_reg_loss: 0.2081, reg_loss: 0.2081 ||:  14%|#3        | 13/95 [00:06<00:43,  1.89it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9496, LAS: 0.9090, UEM: 0.6142, LEM: 0.4085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4898, partial_loss/deprel_loss: 0.4025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6281, loss: 0.6798, batch_reg_loss: 0.2081, reg_loss: 0.2081 ||:  18%|#7        | 17/95 [00:09<00:43,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9502, LAS: 0.9097, UEM: 0.6272, LEM: 0.4207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1815, partial_loss/deprel_loss: 0.3025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4864, loss: 0.6779, batch_reg_loss: 0.2081, reg_loss: 0.2081 ||:  22%|##2       | 21/95 [00:11<00:42,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9501, LAS: 0.9099, UEM: 0.6164, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5556, partial_loss/deprel_loss: 0.5475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7572, loss: 0.6785, batch_reg_loss: 0.2081, reg_loss: 0.2081 ||:  26%|##6       | 25/95 [00:14<00:40,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9503, LAS: 0.9097, UEM: 0.6350, LEM: 0.4257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1782, partial_loss/deprel_loss: 0.8499, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1236, loss: 0.6830, batch_reg_loss: 0.2080, reg_loss: 0.2081 ||:  29%|##9       | 28/95 [00:16<00:41,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9508, LAS: 0.9102, UEM: 0.6442, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6302, partial_loss/deprel_loss: 0.6189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8292, loss: 0.6801, batch_reg_loss: 0.2080, reg_loss: 0.2081 ||:  33%|###2      | 31/95 [00:18<00:43,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9331, UAS: 0.9524, LAS: 0.9118, UEM: 0.6488, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2152, partial_loss/deprel_loss: 0.3765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5522, loss: 0.6697, batch_reg_loss: 0.2080, reg_loss: 0.2081 ||:  36%|###5      | 34/95 [00:21<00:45,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9180, UAS: 0.9520, LAS: 0.9110, UEM: 0.6294, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3294, partial_loss/deprel_loss: 0.4594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6414, loss: 0.6780, batch_reg_loss: 0.2080, reg_loss: 0.2081 ||:  40%|####      | 38/95 [00:23<00:40,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9528, LAS: 0.9117, UEM: 0.6301, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3072, partial_loss/deprel_loss: 0.4471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6271, loss: 0.6748, batch_reg_loss: 0.2080, reg_loss: 0.2081 ||:  43%|####3     | 41/95 [00:26<00:39,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9522, LAS: 0.9110, UEM: 0.6249, LEM: 0.4009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1996, partial_loss/deprel_loss: 0.3869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5574, loss: 0.6809, batch_reg_loss: 0.2080, reg_loss: 0.2081 ||:  46%|####6     | 44/95 [00:28<00:37,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9524, LAS: 0.9111, UEM: 0.6271, LEM: 0.4018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7328, partial_loss/deprel_loss: 0.6320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8601, loss: 0.6801, batch_reg_loss: 0.2079, reg_loss: 0.2081 ||:  49%|####9     | 47/95 [00:30<00:34,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9531, LAS: 0.9117, UEM: 0.6350, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2185, partial_loss/deprel_loss: 0.3277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5138, loss: 0.6734, batch_reg_loss: 0.2079, reg_loss: 0.2081 ||:  53%|#####2    | 50/95 [00:32<00:33,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8448, UAS: 0.9525, LAS: 0.9113, UEM: 0.6358, LEM: 0.4071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5059, partial_loss/deprel_loss: 0.8047, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1528, loss: 0.6778, batch_reg_loss: 0.2079, reg_loss: 0.2080 ||:  56%|#####5    | 53/95 [00:35<00:30,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9525, LAS: 0.9112, UEM: 0.6277, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5079, partial_loss/deprel_loss: 0.5327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7356, loss: 0.6800, batch_reg_loss: 0.2079, reg_loss: 0.2080 ||:  60%|######    | 57/95 [00:37<00:27,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9517, LAS: 0.9103, UEM: 0.6262, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7173, partial_loss/deprel_loss: 0.6186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8463, loss: 0.6859, batch_reg_loss: 0.2079, reg_loss: 0.2080 ||:  63%|######3   | 60/95 [00:39<00:24,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9513, LAS: 0.9099, UEM: 0.6200, LEM: 0.3906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0373, partial_loss/deprel_loss: 0.7337, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0023, loss: 0.6889, batch_reg_loss: 0.2079, reg_loss: 0.2080 ||:  67%|######7   | 64/95 [00:42<00:21,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9521, LAS: 0.9109, UEM: 0.6394, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4713, partial_loss/deprel_loss: 0.4861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6910, loss: 0.6820, batch_reg_loss: 0.2078, reg_loss: 0.2080 ||:  71%|#######   | 67/95 [00:44<00:20,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9529, LAS: 0.9116, UEM: 0.6413, LEM: 0.4155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4729, partial_loss/deprel_loss: 0.5493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7419, loss: 0.6771, batch_reg_loss: 0.2078, reg_loss: 0.2080 ||:  75%|#######4  | 71/95 [00:47<00:16,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9530, LAS: 0.9115, UEM: 0.6350, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3582, partial_loss/deprel_loss: 0.4322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6252, loss: 0.6786, batch_reg_loss: 0.2078, reg_loss: 0.2080 ||:  79%|#######8  | 75/95 [00:49<00:13,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9535, LAS: 0.9119, UEM: 0.6321, LEM: 0.3990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2951, partial_loss/deprel_loss: 0.4685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6416, loss: 0.6769, batch_reg_loss: 0.2078, reg_loss: 0.2080 ||:  83%|########3 | 79/95 [00:52<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9541, LAS: 0.9124, UEM: 0.6400, LEM: 0.4063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4562, partial_loss/deprel_loss: 0.5250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7190, loss: 0.6728, batch_reg_loss: 0.2078, reg_loss: 0.2080 ||:  86%|########6 | 82/95 [00:54<00:09,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9545, LAS: 0.9130, UEM: 0.6445, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2685, partial_loss/deprel_loss: 0.3363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5305, loss: 0.6686, batch_reg_loss: 0.2077, reg_loss: 0.2080 ||:  89%|########9 | 85/95 [00:56<00:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.9535, LAS: 0.9119, UEM: 0.6368, LEM: 0.4041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0026, partial_loss/deprel_loss: 0.7095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9758, loss: 0.6767, batch_reg_loss: 0.2077, reg_loss: 0.2080 ||:  93%|#########2| 88/95 [00:59<00:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9535, LAS: 0.9118, UEM: 0.6334, LEM: 0.3994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2819, partial_loss/deprel_loss: 0.4044, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5876, loss: 0.6783, batch_reg_loss: 0.2077, reg_loss: 0.2079 ||:  97%|#########6| 92/95 [01:01<00:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9531, LAS: 0.9113, UEM: 0.6284, LEM: 0.3948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6236, partial_loss/deprel_loss: 0.5961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8093, loss: 0.6821, batch_reg_loss: 0.2077, reg_loss: 0.2079 ||: 100%|##########| 95/95 [01:03<00:00,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9531, LAS: 0.9113, UEM: 0.6284, LEM: 0.3948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6236, partial_loss/deprel_loss: 0.5961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8093, loss: 0.6821, batch_reg_loss: 0.2077, reg_loss: 0.2079 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-07 00:54:27,132 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9344, LAS: 0.8765, UEM: 0.4206, LEM: 0.1262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4799, partial_loss/deprel_loss: 34.4669, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8695, loss: 18.9120, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9525, LAS: 0.9021, UEM: 0.6547, LEM: 0.3652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1809, partial_loss/deprel_loss: 8.1429, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5505, loss: 13.7622, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:05<00:06,  1.02s/it]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9503, LAS: 0.9009, UEM: 0.6862, LEM: 0.4429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2093, partial_loss/deprel_loss: 6.0463, partial_loss/cycle_loss: 0.0000, batch_loss: 4.8789, loss: 14.6505, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:08<00:03,  1.02s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9518, LAS: 0.9015, UEM: 0.6800, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4081, partial_loss/deprel_loss: 9.3230, partial_loss/cycle_loss: 0.0000, batch_loss: 7.5400, loss: 13.5045, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9518, LAS: 0.9015, UEM: 0.6800, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4081, partial_loss/deprel_loss: 9.3230, partial_loss/cycle_loss: 0.0000, batch_loss: 7.5400, loss: 13.5045, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.03it/s]\n",
+      "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.208  |     0.000\n",
+      "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - UEM                      |     0.628  |     0.680\n",
+      "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - LEM                      |     0.395  |     0.416\n",
+      "2023-04-07 00:54:37,859 - INFO - combo.training.tensorboard_writer - EM                       |     0.900  |     0.921\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.624  |     0.408\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - UAS                      |     0.953  |     0.952\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.596  |     9.323\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - loss                     |     0.682  |    13.504\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - LAS                      |     0.911  |     0.901\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:54:37,860 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:54:37,865 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:54:43,239 - INFO - combo.training.trainer - Epoch duration: 0:01:23.092109\n",
+      "2023-04-07 00:54:43,239 - INFO - combo.training.trainer - Estimated training time remaining: 5:25:45\n",
+      "2023-04-07 00:54:43,240 - INFO - allennlp.training.trainer - Epoch 111/399\n",
+      "2023-04-07 00:54:43,240 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:54:43,241 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:54:43,251 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9590, LAS: 0.9166, UEM: 0.6606, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5436, partial_loss/deprel_loss: 0.5115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7256, loss: 0.6280, batch_reg_loss: 0.2077, reg_loss: 0.2077 ||:   5%|5         | 5/95 [00:02<00:39,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9373, LAS: 0.8936, UEM: 0.5443, LEM: 0.3220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7137, partial_loss/deprel_loss: 0.5885, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8212, loss: 0.7938, batch_reg_loss: 0.2077, reg_loss: 0.2077 ||:   9%|9         | 9/95 [00:04<00:42,  2.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9437, LAS: 0.9003, UEM: 0.6005, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1950, partial_loss/deprel_loss: 0.4090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5739, loss: 0.7501, batch_reg_loss: 0.2077, reg_loss: 0.2077 ||:  13%|#2        | 12/95 [00:06<00:45,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9476, LAS: 0.9040, UEM: 0.6031, LEM: 0.3496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2522, partial_loss/deprel_loss: 0.4405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6105, loss: 0.7300, batch_reg_loss: 0.2076, reg_loss: 0.2077 ||:  17%|#6        | 16/95 [00:09<00:44,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9514, LAS: 0.9084, UEM: 0.6514, LEM: 0.3956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1930, partial_loss/deprel_loss: 0.3176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5003, loss: 0.6952, batch_reg_loss: 0.2076, reg_loss: 0.2077 ||:  20%|##        | 19/95 [00:11<00:47,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9505, LAS: 0.9072, UEM: 0.6217, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5095, partial_loss/deprel_loss: 0.5757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7701, loss: 0.7075, batch_reg_loss: 0.2076, reg_loss: 0.2077 ||:  23%|##3       | 22/95 [00:13<00:48,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9532, LAS: 0.9101, UEM: 0.6547, LEM: 0.4021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1771, partial_loss/deprel_loss: 0.3581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5295, loss: 0.6859, batch_reg_loss: 0.2076, reg_loss: 0.2076 ||:  26%|##6       | 25/95 [00:15<00:46,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9536, LAS: 0.9108, UEM: 0.6392, LEM: 0.3879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5182, partial_loss/deprel_loss: 0.5426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7453, loss: 0.6827, batch_reg_loss: 0.2076, reg_loss: 0.2076 ||:  31%|###       | 29/95 [00:18<00:42,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9540, LAS: 0.9114, UEM: 0.6238, LEM: 0.3745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3374, partial_loss/deprel_loss: 0.3857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5836, loss: 0.6796, batch_reg_loss: 0.2076, reg_loss: 0.2076 ||:  35%|###4      | 33/95 [00:20<00:38,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9668, UAS: 0.9550, LAS: 0.9132, UEM: 0.6617, LEM: 0.4304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0337, partial_loss/deprel_loss: 0.1306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3188, loss: 0.6679, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||:  39%|###8      | 37/95 [00:24<00:41,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9540, LAS: 0.9120, UEM: 0.6489, LEM: 0.4159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9585, partial_loss/deprel_loss: 0.6945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9548, loss: 0.6778, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||:  43%|####3     | 41/95 [00:26<00:37,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9540, LAS: 0.9122, UEM: 0.6452, LEM: 0.4120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4219, partial_loss/deprel_loss: 0.4436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6468, loss: 0.6761, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||:  46%|####6     | 44/95 [00:28<00:36,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9541, LAS: 0.9121, UEM: 0.6530, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3005, partial_loss/deprel_loss: 0.4328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.6782, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||:  49%|####9     | 47/95 [00:31<00:35,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9541, LAS: 0.9122, UEM: 0.6494, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2077, partial_loss/deprel_loss: 0.3303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5132, loss: 0.6784, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||:  53%|#####2    | 50/95 [00:33<00:33,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9547, LAS: 0.9127, UEM: 0.6445, LEM: 0.4090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3559, partial_loss/deprel_loss: 0.4327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6248, loss: 0.6742, batch_reg_loss: 0.2075, reg_loss: 0.2076 ||:  57%|#####6    | 54/95 [00:36<00:29,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9557, LAS: 0.9136, UEM: 0.6559, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2399, partial_loss/deprel_loss: 0.3943, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5708, loss: 0.6671, batch_reg_loss: 0.2074, reg_loss: 0.2076 ||:  60%|######    | 57/95 [00:38<00:28,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9552, LAS: 0.9130, UEM: 0.6515, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2354, partial_loss/deprel_loss: 0.3737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5534, loss: 0.6727, batch_reg_loss: 0.2074, reg_loss: 0.2076 ||:  64%|######4   | 61/95 [00:41<00:24,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9553, LAS: 0.9132, UEM: 0.6486, LEM: 0.4083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2017, partial_loss/deprel_loss: 0.3469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5252, loss: 0.6709, batch_reg_loss: 0.2074, reg_loss: 0.2076 ||:  68%|######8   | 65/95 [00:43<00:20,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9549, LAS: 0.9127, UEM: 0.6378, LEM: 0.3987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2895, partial_loss/deprel_loss: 0.4096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5929, loss: 0.6746, batch_reg_loss: 0.2074, reg_loss: 0.2075 ||:  73%|#######2  | 69/95 [00:46<00:17,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9554, LAS: 0.9134, UEM: 0.6394, LEM: 0.3992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4656, partial_loss/deprel_loss: 0.5376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7305, loss: 0.6704, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||:  77%|#######6  | 73/95 [00:49<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9559, LAS: 0.9139, UEM: 0.6483, LEM: 0.4087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2332, partial_loss/deprel_loss: 0.4139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5851, loss: 0.6655, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||:  81%|########1 | 77/95 [00:51<00:12,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9549, LAS: 0.9128, UEM: 0.6375, LEM: 0.4001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7371, partial_loss/deprel_loss: 0.5769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8163, loss: 0.6732, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||:  85%|########5 | 81/95 [00:54<00:09,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9552, LAS: 0.9131, UEM: 0.6416, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4893, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7102, loss: 0.6706, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||:  88%|########8 | 84/95 [00:56<00:07,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9546, LAS: 0.9124, UEM: 0.6412, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1989, partial_loss/deprel_loss: 0.3788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5501, loss: 0.6747, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||:  93%|#########2| 88/95 [00:58<00:04,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9546, LAS: 0.9125, UEM: 0.6358, LEM: 0.3966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2665, partial_loss/deprel_loss: 0.4082, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5872, loss: 0.6744, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||:  97%|#########6| 92/95 [01:01<00:01,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9548, LAS: 0.9128, UEM: 0.6377, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2456, partial_loss/deprel_loss: 0.3930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5708, loss: 0.6717, batch_reg_loss: 0.2073, reg_loss: 0.2075 ||: 100%|##########| 95/95 [01:03<00:00,  1.50it/s]\n",
+      "2023-04-07 00:55:49,824 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.207  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - UEM                      |     0.638  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - LEM                      |     0.398  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - EM                       |     0.931  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.246  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.393  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - loss                     |     0.672  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - LAS                      |     0.913  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:55:49,825 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:55:49,826 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:55:49,826 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:55:49,826 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:55:49,826 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:55:49,830 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 00:55:54,628 - INFO - combo.training.trainer - Epoch duration: 0:01:11.388004\n",
+      "2023-04-07 00:55:54,628 - INFO - combo.training.trainer - Estimated training time remaining: 5:24:47\n",
+      "2023-04-07 00:55:54,628 - INFO - allennlp.training.trainer - Epoch 112/399\n",
+      "2023-04-07 00:55:54,629 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:55:54,629 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:55:54,638 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9541, LAS: 0.9113, UEM: 0.6700, LEM: 0.4170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2265, partial_loss/deprel_loss: 0.3354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5209, loss: 0.6850, batch_reg_loss: 0.2072, reg_loss: 0.2072 ||:   3%|3         | 3/95 [00:02<01:07,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9573, LAS: 0.9152, UEM: 0.6773, LEM: 0.4345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1977, partial_loss/deprel_loss: 0.3732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5453, loss: 0.6647, batch_reg_loss: 0.2072, reg_loss: 0.2072 ||:   6%|6         | 6/95 [00:04<01:05,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9541, LAS: 0.9116, UEM: 0.6053, LEM: 0.3598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0969, partial_loss/deprel_loss: 0.7053, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9908, loss: 0.6865, batch_reg_loss: 0.2072, reg_loss: 0.2072 ||:  12%|#1        | 11/95 [00:06<00:54,  1.53it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9544, LAS: 0.9121, UEM: 0.6304, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2483, partial_loss/deprel_loss: 0.4131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5873, loss: 0.6820, batch_reg_loss: 0.2072, reg_loss: 0.2072 ||:  16%|#5        | 15/95 [00:08<00:49,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8412, UAS: 0.9508, LAS: 0.9085, UEM: 0.5879, LEM: 0.3531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5111, partial_loss/deprel_loss: 0.8153, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1616, loss: 0.7109, batch_reg_loss: 0.2072, reg_loss: 0.2072 ||:  21%|##1       | 20/95 [00:11<00:43,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9532, LAS: 0.9110, UEM: 0.5929, LEM: 0.3462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3499, partial_loss/deprel_loss: 0.4477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6353, loss: 0.6941, batch_reg_loss: 0.2071, reg_loss: 0.2072 ||:  26%|##6       | 25/95 [00:13<00:38,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9550, LAS: 0.9132, UEM: 0.6118, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2080, partial_loss/deprel_loss: 0.3424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5226, loss: 0.6762, batch_reg_loss: 0.2071, reg_loss: 0.2072 ||:  31%|###       | 29/95 [00:16<00:38,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9534, LAS: 0.9113, UEM: 0.6007, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5243, partial_loss/deprel_loss: 0.5013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7130, loss: 0.6886, batch_reg_loss: 0.2071, reg_loss: 0.2072 ||:  35%|###4      | 33/95 [00:19<00:38,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9525, LAS: 0.9106, UEM: 0.5940, LEM: 0.3442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5756, partial_loss/deprel_loss: 0.4825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7082, loss: 0.6925, batch_reg_loss: 0.2071, reg_loss: 0.2072 ||:  39%|###8      | 37/95 [00:21<00:36,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9515, LAS: 0.9096, UEM: 0.5879, LEM: 0.3398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5804, partial_loss/deprel_loss: 0.5401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7552, loss: 0.6975, batch_reg_loss: 0.2071, reg_loss: 0.2072 ||:  43%|####3     | 41/95 [00:24<00:35,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9521, LAS: 0.9104, UEM: 0.5935, LEM: 0.3457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8963, partial_loss/deprel_loss: 0.6886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9372, loss: 0.6926, batch_reg_loss: 0.2071, reg_loss: 0.2072 ||:  47%|####7     | 45/95 [00:27<00:32,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9509, LAS: 0.9092, UEM: 0.5827, LEM: 0.3359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4573, partial_loss/deprel_loss: 0.5203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7148, loss: 0.7012, batch_reg_loss: 0.2071, reg_loss: 0.2071 ||:  52%|#####1    | 49/95 [00:29<00:29,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.9512, LAS: 0.9096, UEM: 0.5857, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7286, partial_loss/deprel_loss: 0.6428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8670, loss: 0.6983, batch_reg_loss: 0.2070, reg_loss: 0.2071 ||:  56%|#####5    | 53/95 [00:32<00:27,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9371, UAS: 0.9525, LAS: 0.9110, UEM: 0.5959, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1759, partial_loss/deprel_loss: 0.3055, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4866, loss: 0.6898, batch_reg_loss: 0.2070, reg_loss: 0.2071 ||:  60%|######    | 57/95 [00:35<00:25,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9532, LAS: 0.9117, UEM: 0.6244, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2594, partial_loss/deprel_loss: 0.3744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5584, loss: 0.6855, batch_reg_loss: 0.2070, reg_loss: 0.2071 ||:  64%|######4   | 61/95 [00:38<00:25,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9535, LAS: 0.9120, UEM: 0.6219, LEM: 0.3828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3242, partial_loss/deprel_loss: 0.3285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5346, loss: 0.6825, batch_reg_loss: 0.2070, reg_loss: 0.2071 ||:  67%|######7   | 64/95 [00:41<00:22,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9537, LAS: 0.9123, UEM: 0.6160, LEM: 0.3767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5349, partial_loss/deprel_loss: 0.5850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7820, loss: 0.6816, batch_reg_loss: 0.2070, reg_loss: 0.2071 ||:  72%|#######1  | 68/95 [00:43<00:18,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9541, LAS: 0.9126, UEM: 0.6144, LEM: 0.3722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2564, partial_loss/deprel_loss: 0.4012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5792, loss: 0.6797, batch_reg_loss: 0.2069, reg_loss: 0.2071 ||:  76%|#######5  | 72/95 [00:45<00:15,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9540, LAS: 0.9126, UEM: 0.6114, LEM: 0.3713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5900, partial_loss/deprel_loss: 0.5781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7874, loss: 0.6779, batch_reg_loss: 0.2069, reg_loss: 0.2071 ||:  80%|########  | 76/95 [00:48<00:12,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8803, UAS: 0.9537, LAS: 0.9124, UEM: 0.6128, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8648, partial_loss/deprel_loss: 0.6347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8876, loss: 0.6790, batch_reg_loss: 0.2069, reg_loss: 0.2071 ||:  84%|########4 | 80/95 [00:51<00:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9539, LAS: 0.9127, UEM: 0.6176, LEM: 0.3807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2030, partial_loss/deprel_loss: 0.3326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5135, loss: 0.6768, batch_reg_loss: 0.2069, reg_loss: 0.2071 ||:  88%|########8 | 84/95 [00:54<00:07,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9539, LAS: 0.9127, UEM: 0.6162, LEM: 0.3785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7537, partial_loss/deprel_loss: 0.6348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8654, loss: 0.6763, batch_reg_loss: 0.2069, reg_loss: 0.2071 ||:  92%|#########1| 87/95 [00:56<00:05,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9547, LAS: 0.9135, UEM: 0.6343, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0920, partial_loss/deprel_loss: 0.2665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4384, loss: 0.6691, batch_reg_loss: 0.2068, reg_loss: 0.2071 ||:  95%|#########4| 90/95 [00:58<00:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9546, LAS: 0.9134, UEM: 0.6399, LEM: 0.4063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0046, partial_loss/deprel_loss: 0.6334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9145, loss: 0.6691, batch_reg_loss: 0.2068, reg_loss: 0.2070 ||:  98%|#########7| 93/95 [01:01<00:01,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9545, LAS: 0.9133, UEM: 0.6376, LEM: 0.4041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7759, partial_loss/deprel_loss: 0.6346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8696, loss: 0.6706, batch_reg_loss: 0.2068, reg_loss: 0.2070 ||: 100%|##########| 95/95 [01:02<00:00,  1.51it/s]\n",
+      "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.207  |       N/A\n",
+      "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - UEM                      |     0.638  |       N/A\n",
+      "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - LEM                      |     0.404  |       N/A\n",
+      "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - EM                       |     0.892  |       N/A\n",
+      "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.776  |       N/A\n",
+      "2023-04-07 00:57:00,550 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.635  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - loss                     |     0.671  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - LAS                      |     0.913  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:57:00,551 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:57:00,556 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 00:57:05,958 - INFO - combo.training.trainer - Epoch duration: 0:01:11.329365\n",
+      "2023-04-07 00:57:05,958 - INFO - combo.training.trainer - Estimated training time remaining: 5:23:49\n",
+      "2023-04-07 00:57:05,958 - INFO - allennlp.training.trainer - Epoch 113/399\n",
+      "2023-04-07 00:57:05,959 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:57:05,959 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:57:05,969 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9584, LAS: 0.9173, UEM: 0.6802, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1106, partial_loss/deprel_loss: 0.2887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4599, loss: 0.6359, batch_reg_loss: 0.2068, reg_loss: 0.2068 ||:   4%|4         | 4/95 [00:02<01:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9530, LAS: 0.9123, UEM: 0.5739, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7199, partial_loss/deprel_loss: 0.5625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8007, loss: 0.6692, batch_reg_loss: 0.2068, reg_loss: 0.2068 ||:   7%|7         | 7/95 [00:05<01:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9498, LAS: 0.9099, UEM: 0.5849, LEM: 0.3816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8978, partial_loss/deprel_loss: 0.6391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8976, loss: 0.6865, batch_reg_loss: 0.2068, reg_loss: 0.2068 ||:  11%|#         | 10/95 [00:07<01:01,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9471, LAS: 0.9058, UEM: 0.5426, LEM: 0.3332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2796, partial_loss/deprel_loss: 0.7912, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0956, loss: 0.7191, batch_reg_loss: 0.2067, reg_loss: 0.2068 ||:  15%|#4        | 14/95 [00:09<00:56,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9484, LAS: 0.9070, UEM: 0.5279, LEM: 0.3104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4803, partial_loss/deprel_loss: 0.4972, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7005, loss: 0.7120, batch_reg_loss: 0.2067, reg_loss: 0.2068 ||:  19%|#8        | 18/95 [00:12<00:52,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9518, LAS: 0.9112, UEM: 0.5883, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1955, partial_loss/deprel_loss: 0.3472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5235, loss: 0.6831, batch_reg_loss: 0.2067, reg_loss: 0.2068 ||:  22%|##2       | 21/95 [00:14<00:52,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9522, LAS: 0.9115, UEM: 0.5883, LEM: 0.3545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4520, partial_loss/deprel_loss: 0.5374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7270, loss: 0.6812, batch_reg_loss: 0.2067, reg_loss: 0.2067 ||:  27%|##7       | 26/95 [00:17<00:44,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9523, LAS: 0.9114, UEM: 0.5781, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3002, partial_loss/deprel_loss: 0.3527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5488, loss: 0.6800, batch_reg_loss: 0.2067, reg_loss: 0.2067 ||:  33%|###2      | 31/95 [00:19<00:37,  1.72it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9533, LAS: 0.9122, UEM: 0.5999, LEM: 0.3633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7041, partial_loss/deprel_loss: 0.6440, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8626, loss: 0.6761, batch_reg_loss: 0.2066, reg_loss: 0.2067 ||:  38%|###7      | 36/95 [00:21<00:32,  1.84it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9536, LAS: 0.9129, UEM: 0.5938, LEM: 0.3540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.4526, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6463, loss: 0.6712, batch_reg_loss: 0.2066, reg_loss: 0.2067 ||:  43%|####3     | 41/95 [00:23<00:27,  1.97it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9542, LAS: 0.9137, UEM: 0.6311, LEM: 0.4057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4491, partial_loss/deprel_loss: 0.5503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7366, loss: 0.6646, batch_reg_loss: 0.2066, reg_loss: 0.2067 ||:  48%|####8     | 46/95 [00:27<00:28,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9545, LAS: 0.9140, UEM: 0.6245, LEM: 0.3965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3037, partial_loss/deprel_loss: 0.3956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.6616, batch_reg_loss: 0.2066, reg_loss: 0.2067 ||:  53%|#####2    | 50/95 [00:30<00:28,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9544, LAS: 0.9136, UEM: 0.6169, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7795, partial_loss/deprel_loss: 0.6187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8574, loss: 0.6660, batch_reg_loss: 0.2065, reg_loss: 0.2067 ||:  57%|#####6    | 54/95 [00:32<00:25,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8638, UAS: 0.9546, LAS: 0.9136, UEM: 0.6236, LEM: 0.3896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0144, partial_loss/deprel_loss: 0.7123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9792, loss: 0.6655, batch_reg_loss: 0.2065, reg_loss: 0.2067 ||:  61%|######1   | 58/95 [00:35<00:23,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9545, LAS: 0.9136, UEM: 0.6254, LEM: 0.3891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4074, partial_loss/deprel_loss: 0.4601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6560, loss: 0.6656, batch_reg_loss: 0.2065, reg_loss: 0.2067 ||:  65%|######5   | 62/95 [00:38<00:20,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8890, UAS: 0.9541, LAS: 0.9131, UEM: 0.6179, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7141, partial_loss/deprel_loss: 0.6444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8648, loss: 0.6699, batch_reg_loss: 0.2065, reg_loss: 0.2066 ||:  69%|######9   | 66/95 [00:41<00:19,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9549, LAS: 0.9139, UEM: 0.6262, LEM: 0.3857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3050, partial_loss/deprel_loss: 0.4015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5887, loss: 0.6640, batch_reg_loss: 0.2065, reg_loss: 0.2066 ||:  74%|#######3  | 70/95 [00:44<00:17,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9549, LAS: 0.9140, UEM: 0.6246, LEM: 0.3834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3999, partial_loss/deprel_loss: 0.5016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6877, loss: 0.6638, batch_reg_loss: 0.2065, reg_loss: 0.2066 ||:  77%|#######6  | 73/95 [00:46<00:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9554, LAS: 0.9145, UEM: 0.6319, LEM: 0.3919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.2806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4557, loss: 0.6601, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||:  80%|########  | 76/95 [00:48<00:14,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9548, LAS: 0.9138, UEM: 0.6278, LEM: 0.3880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2888, partial_loss/deprel_loss: 0.4178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5984, loss: 0.6661, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||:  83%|########3 | 79/95 [00:51<00:11,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9551, LAS: 0.9141, UEM: 0.6284, LEM: 0.3882, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1992, partial_loss/deprel_loss: 0.2848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4741, loss: 0.6631, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||:  87%|########7 | 83/95 [00:53<00:08,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9553, LAS: 0.9143, UEM: 0.6391, LEM: 0.4009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1942, partial_loss/deprel_loss: 0.3815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5504, loss: 0.6611, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||:  91%|######### | 86/95 [00:56<00:06,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9544, LAS: 0.9134, UEM: 0.6323, LEM: 0.3953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4970, partial_loss/deprel_loss: 0.5067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7111, loss: 0.6680, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||:  94%|#########3| 89/95 [00:58<00:04,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9545, LAS: 0.9134, UEM: 0.6324, LEM: 0.3946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7042, partial_loss/deprel_loss: 0.6272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8490, loss: 0.6676, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||:  98%|#########7| 93/95 [01:00<00:01,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9549, LAS: 0.9138, UEM: 0.6379, LEM: 0.3988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2131, partial_loss/deprel_loss: 0.3441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5243, loss: 0.6649, batch_reg_loss: 0.2064, reg_loss: 0.2066 ||: 100%|##########| 95/95 [01:02<00:00,  1.53it/s]\n",
+      "2023-04-07 00:58:10,927 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:58:10,927 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:58:10,927 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.207  |       N/A\n",
+      "2023-04-07 00:58:10,927 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - UEM                      |     0.638  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - LEM                      |     0.399  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - EM                       |     0.939  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.213  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.344  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - loss                     |     0.665  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - LAS                      |     0.914  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:58:10,928 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:58:10,929 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:58:10,932 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:58:15,015 - INFO - combo.training.trainer - Epoch duration: 0:01:09.056259\n",
+      "2023-04-07 00:58:15,015 - INFO - combo.training.trainer - Estimated training time remaining: 5:22:44\n",
+      "2023-04-07 00:58:15,015 - INFO - allennlp.training.trainer - Epoch 114/399\n",
+      "2023-04-07 00:58:15,015 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:58:15,016 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:58:15,025 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9314, LAS: 0.8917, UEM: 0.7087, LEM: 0.5256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1108, partial_loss/deprel_loss: 0.2852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4566, loss: 0.7819, batch_reg_loss: 0.2064, reg_loss: 0.2064 ||:   3%|3         | 3/95 [00:04<02:07,  1.39s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9427, LAS: 0.9017, UEM: 0.5768, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5833, partial_loss/deprel_loss: 0.5521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7647, loss: 0.7315, batch_reg_loss: 0.2063, reg_loss: 0.2064 ||:   7%|7         | 7/95 [00:06<01:41,  1.15s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9447, LAS: 0.9032, UEM: 0.5226, LEM: 0.3182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4223, partial_loss/deprel_loss: 0.4529, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6531, loss: 0.7285, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||:  12%|#1        | 11/95 [00:08<01:22,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9483, LAS: 0.9059, UEM: 0.5293, LEM: 0.3032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4901, partial_loss/deprel_loss: 0.5842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7717, loss: 0.7123, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||:  15%|#4        | 14/95 [00:11<01:12,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9464, LAS: 0.9037, UEM: 0.5079, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7024, partial_loss/deprel_loss: 0.6527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8690, loss: 0.7267, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||:  19%|#8        | 18/95 [00:13<01:02,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9472, LAS: 0.9046, UEM: 0.5318, LEM: 0.2996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7510, partial_loss/deprel_loss: 0.5741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8158, loss: 0.7191, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||:  22%|##2       | 21/95 [00:16<01:01,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9480, LAS: 0.9057, UEM: 0.5322, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6785, partial_loss/deprel_loss: 0.5636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7929, loss: 0.7136, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||:  25%|##5       | 24/95 [00:18<00:57,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9465, LAS: 0.9042, UEM: 0.5057, LEM: 0.2787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8269, partial_loss/deprel_loss: 0.5861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8406, loss: 0.7281, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||:  28%|##8       | 27/95 [00:20<00:52,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9471, LAS: 0.9053, UEM: 0.5396, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6627, partial_loss/deprel_loss: 0.5766, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8001, loss: 0.7164, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||:  33%|###2      | 31/95 [00:23<00:47,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9465, LAS: 0.9044, UEM: 0.5289, LEM: 0.3153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4289, partial_loss/deprel_loss: 0.5023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6939, loss: 0.7222, batch_reg_loss: 0.2063, reg_loss: 0.2063 ||:  36%|###5      | 34/95 [00:25<00:44,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9481, LAS: 0.9060, UEM: 0.5428, LEM: 0.3204, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2243, partial_loss/deprel_loss: 0.3679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.7106, batch_reg_loss: 0.2062, reg_loss: 0.2063 ||:  40%|####      | 38/95 [00:27<00:39,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9504, LAS: 0.9085, UEM: 0.5692, LEM: 0.3384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3216, partial_loss/deprel_loss: 0.4033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.6906, batch_reg_loss: 0.2062, reg_loss: 0.2063 ||:  45%|####5     | 43/95 [00:29<00:31,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9508, LAS: 0.9088, UEM: 0.5726, LEM: 0.3382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8930, partial_loss/deprel_loss: 0.5813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8498, loss: 0.6889, batch_reg_loss: 0.2062, reg_loss: 0.2063 ||:  49%|####9     | 47/95 [00:31<00:27,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9514, LAS: 0.9093, UEM: 0.5837, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1193, partial_loss/deprel_loss: 0.2989, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4692, loss: 0.6875, batch_reg_loss: 0.2062, reg_loss: 0.2063 ||:  55%|#####4    | 52/95 [00:33<00:23,  1.86it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9684, UAS: 0.9524, LAS: 0.9107, UEM: 0.6082, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0420, partial_loss/deprel_loss: 0.1186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3095, loss: 0.6773, batch_reg_loss: 0.2062, reg_loss: 0.2063 ||:  60%|######    | 57/95 [00:36<00:20,  1.85it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9536, LAS: 0.9120, UEM: 0.6220, LEM: 0.3946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3440, partial_loss/deprel_loss: 0.3558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5596, loss: 0.6674, batch_reg_loss: 0.2061, reg_loss: 0.2063 ||:  64%|######4   | 61/95 [00:39<00:20,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9546, LAS: 0.9131, UEM: 0.6359, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2063, partial_loss/deprel_loss: 0.3269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5089, loss: 0.6604, batch_reg_loss: 0.2061, reg_loss: 0.2063 ||:  68%|######8   | 65/95 [00:42<00:19,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9554, LAS: 0.9141, UEM: 0.6416, LEM: 0.4083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1980, partial_loss/deprel_loss: 0.3228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5039, loss: 0.6536, batch_reg_loss: 0.2061, reg_loss: 0.2062 ||:  73%|#######2  | 69/95 [00:45<00:17,  1.52it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8658, UAS: 0.9554, LAS: 0.9140, UEM: 0.6468, LEM: 0.4109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1753, partial_loss/deprel_loss: 0.7502, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0412, loss: 0.6552, batch_reg_loss: 0.2060, reg_loss: 0.2062 ||:  77%|#######6  | 73/95 [00:48<00:14,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9550, LAS: 0.9135, UEM: 0.6371, LEM: 0.4017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4383, partial_loss/deprel_loss: 0.5298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7175, loss: 0.6596, batch_reg_loss: 0.2060, reg_loss: 0.2062 ||:  81%|########1 | 77/95 [00:50<00:11,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9551, LAS: 0.9139, UEM: 0.6423, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9780, partial_loss/deprel_loss: 0.5931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8761, loss: 0.6583, batch_reg_loss: 0.2060, reg_loss: 0.2062 ||:  85%|########5 | 81/95 [00:53<00:09,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9553, LAS: 0.9140, UEM: 0.6380, LEM: 0.4017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3073, partial_loss/deprel_loss: 0.3879, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5778, loss: 0.6582, batch_reg_loss: 0.2060, reg_loss: 0.2062 ||:  88%|########8 | 84/95 [00:55<00:07,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8638, UAS: 0.9553, LAS: 0.9139, UEM: 0.6417, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1078, partial_loss/deprel_loss: 0.8183, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0821, loss: 0.6598, batch_reg_loss: 0.2059, reg_loss: 0.2062 ||:  93%|#########2| 88/95 [00:58<00:04,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8461, UAS: 0.9549, LAS: 0.9136, UEM: 0.6432, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2994, partial_loss/deprel_loss: 0.8153, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1180, loss: 0.6617, batch_reg_loss: 0.2059, reg_loss: 0.2062 ||:  96%|#########5| 91/95 [01:00<00:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8787, UAS: 0.9545, LAS: 0.9133, UEM: 0.6382, LEM: 0.4020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9167, partial_loss/deprel_loss: 0.6057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8738, loss: 0.6647, batch_reg_loss: 0.2059, reg_loss: 0.2062 ||:  99%|#########8| 94/95 [01:02<00:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9546, LAS: 0.9133, UEM: 0.6378, LEM: 0.4006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2826, partial_loss/deprel_loss: 0.4305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6068, loss: 0.6641, batch_reg_loss: 0.2059, reg_loss: 0.2062 ||: 100%|##########| 95/95 [01:03<00:00,  1.50it/s]\n",
+      "2023-04-07 00:59:21,552 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.206  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - UEM                      |     0.638  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - LEM                      |     0.401  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - EM                       |     0.918  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.283  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.430  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - loss                     |     0.664  |       N/A\n",
+      "2023-04-07 00:59:21,553 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - LAS                      |     0.913  |       N/A\n",
+      "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:59:21,554 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:59:21,559 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 00:59:26,252 - INFO - combo.training.trainer - Epoch duration: 0:01:11.236866\n",
+      "2023-04-07 00:59:26,253 - INFO - combo.training.trainer - Estimated training time remaining: 5:21:45\n",
+      "2023-04-07 00:59:26,253 - INFO - allennlp.training.trainer - Epoch 115/399\n",
+      "2023-04-07 00:59:26,253 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 00:59:26,254 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:59:26,263 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9542, LAS: 0.9129, UEM: 0.6562, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7398, partial_loss/deprel_loss: 0.5365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7831, loss: 0.6562, batch_reg_loss: 0.2059, reg_loss: 0.2059 ||:   4%|4         | 4/95 [00:02<00:57,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9585, LAS: 0.9187, UEM: 0.7247, LEM: 0.5237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4409, partial_loss/deprel_loss: 0.4558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6587, loss: 0.6120, batch_reg_loss: 0.2059, reg_loss: 0.2059 ||:   7%|7         | 7/95 [00:04<00:58,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9152, UAS: 0.9611, LAS: 0.9198, UEM: 0.7109, LEM: 0.4816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4914, partial_loss/deprel_loss: 0.5132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7147, loss: 0.6167, batch_reg_loss: 0.2059, reg_loss: 0.2059 ||:  12%|#1        | 11/95 [00:07<00:56,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9596, LAS: 0.9177, UEM: 0.6701, LEM: 0.4351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4028, partial_loss/deprel_loss: 0.4769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6679, loss: 0.6390, batch_reg_loss: 0.2058, reg_loss: 0.2059 ||:  16%|#5        | 15/95 [00:09<00:51,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9672, UAS: 0.9599, LAS: 0.9190, UEM: 0.7118, LEM: 0.5007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0420, partial_loss/deprel_loss: 0.1296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3179, loss: 0.6322, batch_reg_loss: 0.2058, reg_loss: 0.2059 ||:  20%|##        | 19/95 [00:12<00:50,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8954, UAS: 0.9585, LAS: 0.9178, UEM: 0.6914, LEM: 0.4795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7070, partial_loss/deprel_loss: 0.5902, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8194, loss: 0.6418, batch_reg_loss: 0.2058, reg_loss: 0.2059 ||:  23%|##3       | 22/95 [00:14<00:49,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9599, LAS: 0.9193, UEM: 0.6954, LEM: 0.4724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2777, partial_loss/deprel_loss: 0.4057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.6282, batch_reg_loss: 0.2058, reg_loss: 0.2059 ||:  27%|##7       | 26/95 [00:17<00:46,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9602, LAS: 0.9198, UEM: 0.6900, LEM: 0.4636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3445, partial_loss/deprel_loss: 0.4295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6183, loss: 0.6251, batch_reg_loss: 0.2058, reg_loss: 0.2058 ||:  31%|###       | 29/95 [00:19<00:45,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9577, LAS: 0.9172, UEM: 0.6820, LEM: 0.4575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9818, partial_loss/deprel_loss: 0.7060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9669, loss: 0.6465, batch_reg_loss: 0.2058, reg_loss: 0.2058 ||:  34%|###3      | 32/95 [00:21<00:44,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9320, UAS: 0.9580, LAS: 0.9176, UEM: 0.6762, LEM: 0.4475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2332, partial_loss/deprel_loss: 0.3557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5369, loss: 0.6457, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||:  38%|###7      | 36/95 [00:24<00:40,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9559, LAS: 0.9156, UEM: 0.6609, LEM: 0.4351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9257, partial_loss/deprel_loss: 0.6299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8948, loss: 0.6591, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||:  42%|####2     | 40/95 [00:26<00:36,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9558, LAS: 0.9156, UEM: 0.6678, LEM: 0.4397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1918, partial_loss/deprel_loss: 0.3306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5086, loss: 0.6576, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||:  46%|####6     | 44/95 [00:29<00:34,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9563, LAS: 0.9161, UEM: 0.6686, LEM: 0.4403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1220, partial_loss/deprel_loss: 0.2797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4538, loss: 0.6523, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||:  51%|#####     | 48/95 [00:32<00:30,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9555, LAS: 0.9151, UEM: 0.6544, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4670, partial_loss/deprel_loss: 0.4503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6593, loss: 0.6589, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||:  55%|#####4    | 52/95 [00:34<00:27,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9562, LAS: 0.9156, UEM: 0.6531, LEM: 0.4184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4095, partial_loss/deprel_loss: 0.4563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6526, loss: 0.6558, batch_reg_loss: 0.2057, reg_loss: 0.2058 ||:  59%|#####8    | 56/95 [00:37<00:25,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9563, LAS: 0.9158, UEM: 0.6507, LEM: 0.4165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3193, partial_loss/deprel_loss: 0.4165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6027, loss: 0.6561, batch_reg_loss: 0.2056, reg_loss: 0.2058 ||:  64%|######4   | 61/95 [00:39<00:20,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9571, LAS: 0.9167, UEM: 0.6601, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2201, partial_loss/deprel_loss: 0.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5312, loss: 0.6494, batch_reg_loss: 0.2056, reg_loss: 0.2058 ||:  68%|######8   | 65/95 [00:42<00:18,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9568, LAS: 0.9164, UEM: 0.6540, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2275, partial_loss/deprel_loss: 0.3866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.6510, batch_reg_loss: 0.2056, reg_loss: 0.2057 ||:  73%|#######2  | 69/95 [00:44<00:15,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8654, UAS: 0.9562, LAS: 0.9157, UEM: 0.6508, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0837, partial_loss/deprel_loss: 0.7093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9897, loss: 0.6556, batch_reg_loss: 0.2056, reg_loss: 0.2057 ||:  77%|#######6  | 73/95 [00:47<00:13,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9558, LAS: 0.9151, UEM: 0.6487, LEM: 0.4129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3352, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6186, loss: 0.6592, batch_reg_loss: 0.2056, reg_loss: 0.2057 ||:  81%|########1 | 77/95 [00:49<00:11,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9558, LAS: 0.9152, UEM: 0.6437, LEM: 0.4069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3180, partial_loss/deprel_loss: 0.4234, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6079, loss: 0.6580, batch_reg_loss: 0.2055, reg_loss: 0.2057 ||:  85%|########5 | 81/95 [00:52<00:08,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9558, LAS: 0.9151, UEM: 0.6405, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5322, partial_loss/deprel_loss: 0.6085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7987, loss: 0.6593, batch_reg_loss: 0.2055, reg_loss: 0.2057 ||:  91%|######### | 86/95 [00:54<00:05,  1.69it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9556, LAS: 0.9149, UEM: 0.6366, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4661, partial_loss/deprel_loss: 0.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6402, loss: 0.6593, batch_reg_loss: 0.2055, reg_loss: 0.2057 ||:  96%|#########5| 91/95 [00:57<00:02,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9553, LAS: 0.9146, UEM: 0.6385, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1003, partial_loss/deprel_loss: 0.2611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4344, loss: 0.6610, batch_reg_loss: 0.2055, reg_loss: 0.2057 ||: 100%|##########| 95/95 [00:59<00:00,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9553, LAS: 0.9146, UEM: 0.6385, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1003, partial_loss/deprel_loss: 0.2611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4344, loss: 0.6610, batch_reg_loss: 0.2055, reg_loss: 0.2057 ||: 100%|##########| 95/95 [00:59<00:00,  1.60it/s]\n",
+      "2023-04-07 01:00:28,704 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9416, LAS: 0.8932, UEM: 0.5811, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3733, partial_loss/deprel_loss: 10.4837, partial_loss/cycle_loss: 0.0000, batch_loss: 8.4616, loss: 16.5237, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.04s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9379, LAS: 0.8831, UEM: 0.4572, LEM: 0.2129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0242, partial_loss/deprel_loss: 22.0818, partial_loss/cycle_loss: 0.0000, batch_loss: 17.8702, loss: 16.6606, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:05<00:06,  1.02s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9457, LAS: 0.8922, UEM: 0.5791, LEM: 0.3092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8919, partial_loss/deprel_loss: 15.8157, partial_loss/cycle_loss: 0.0000, batch_loss: 12.8309, loss: 14.5765, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:07<00:04,  1.05s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9497, LAS: 0.8965, UEM: 0.6140, LEM: 0.3146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4204, partial_loss/deprel_loss: 8.2114, partial_loss/cycle_loss: 0.0000, batch_loss: 6.6532, loss: 12.6692, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:09<00:01,  1.01s/it] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9518, LAS: 0.9007, UEM: 0.6806, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2240, partial_loss/deprel_loss: 5.7408, partial_loss/cycle_loss: 0.0000, batch_loss: 4.6375, loss: 11.9390, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.00it/s]\n",
+      "2023-04-07 01:00:39,661 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:00:39,661 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:00:39,661 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.206  |     0.000\n",
+      "2023-04-07 01:00:39,661 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:00:39,661 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - UEM                      |     0.639  |     0.681\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - LEM                      |     0.405  |     0.414\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - EM                       |     0.944  |     0.943\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.100  |     0.224\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |     0.952\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.261  |     5.741\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - loss                     |     0.661  |    11.939\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - LAS                      |     0.915  |     0.901\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:00:39,662 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:00:39,667 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:00:44,474 - INFO - combo.training.trainer - Epoch duration: 0:01:18.220975\n",
+      "2023-04-07 01:00:44,475 - INFO - combo.training.trainer - Estimated training time remaining: 5:21:03\n",
+      "2023-04-07 01:00:44,479 - INFO - allennlp.training.trainer - Epoch 116/399\n",
+      "2023-04-07 01:00:44,479 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:00:44,480 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:00:44,488 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9323, UAS: 0.9680, LAS: 0.9291, UEM: 0.7401, LEM: 0.4826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2020, partial_loss/deprel_loss: 0.3181, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5003, loss: 0.5417, batch_reg_loss: 0.2055, reg_loss: 0.2055 ||:   4%|4         | 4/95 [00:02<01:00,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9690, LAS: 0.9295, UEM: 0.7405, LEM: 0.4711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1814, partial_loss/deprel_loss: 0.3349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5096, loss: 0.5407, batch_reg_loss: 0.2055, reg_loss: 0.2055 ||:   7%|7         | 7/95 [00:04<01:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9584, LAS: 0.9176, UEM: 0.6493, LEM: 0.4011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5633, partial_loss/deprel_loss: 0.6336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8250, loss: 0.6347, batch_reg_loss: 0.2054, reg_loss: 0.2055 ||:  12%|#1        | 11/95 [00:07<00:56,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9598, LAS: 0.9192, UEM: 0.6663, LEM: 0.4137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2746, partial_loss/deprel_loss: 0.3179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5147, loss: 0.6159, batch_reg_loss: 0.2054, reg_loss: 0.2054 ||:  15%|#4        | 14/95 [00:09<00:55,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9610, LAS: 0.9200, UEM: 0.6714, LEM: 0.4091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2278, partial_loss/deprel_loss: 0.3535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5338, loss: 0.6081, batch_reg_loss: 0.2054, reg_loss: 0.2054 ||:  18%|#7        | 17/95 [00:11<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9594, LAS: 0.9186, UEM: 0.6447, LEM: 0.3871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6805, partial_loss/deprel_loss: 0.5717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7988, loss: 0.6208, batch_reg_loss: 0.2054, reg_loss: 0.2054 ||:  22%|##2       | 21/95 [00:14<00:49,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9585, LAS: 0.9173, UEM: 0.6355, LEM: 0.3773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2706, partial_loss/deprel_loss: 0.3599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5474, loss: 0.6278, batch_reg_loss: 0.2054, reg_loss: 0.2054 ||:  26%|##6       | 25/95 [00:16<00:45,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9571, LAS: 0.9159, UEM: 0.6217, LEM: 0.3660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3484, partial_loss/deprel_loss: 0.3916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5883, loss: 0.6413, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||:  29%|##9       | 28/95 [00:18<00:44,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9533, UAS: 0.9567, LAS: 0.9158, UEM: 0.6375, LEM: 0.3951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0705, partial_loss/deprel_loss: 0.1764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3605, loss: 0.6432, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||:  33%|###2      | 31/95 [00:20<00:42,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9577, LAS: 0.9171, UEM: 0.6455, LEM: 0.4021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2440, partial_loss/deprel_loss: 0.3688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5491, loss: 0.6353, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||:  37%|###6      | 35/95 [00:23<00:39,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9562, LAS: 0.9158, UEM: 0.6265, LEM: 0.3870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8137, partial_loss/deprel_loss: 0.6611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8969, loss: 0.6497, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||:  41%|####1     | 39/95 [00:25<00:36,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9554, LAS: 0.9149, UEM: 0.6176, LEM: 0.3781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9319, partial_loss/deprel_loss: 0.6115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8809, loss: 0.6571, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||:  44%|####4     | 42/95 [00:28<00:36,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9563, LAS: 0.9159, UEM: 0.6318, LEM: 0.3923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1224, partial_loss/deprel_loss: 0.2459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4264, loss: 0.6486, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||:  47%|####7     | 45/95 [00:30<00:36,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9558, LAS: 0.9152, UEM: 0.6242, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2016, partial_loss/deprel_loss: 0.3698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5414, loss: 0.6522, batch_reg_loss: 0.2053, reg_loss: 0.2054 ||:  52%|#####1    | 49/95 [00:32<00:31,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9558, LAS: 0.9153, UEM: 0.6202, LEM: 0.3778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3851, partial_loss/deprel_loss: 0.4890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6734, loss: 0.6525, batch_reg_loss: 0.2052, reg_loss: 0.2054 ||:  56%|#####5    | 53/95 [00:35<00:27,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9565, LAS: 0.9161, UEM: 0.6234, LEM: 0.3797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4648, partial_loss/deprel_loss: 0.4853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6864, loss: 0.6478, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||:  60%|######    | 57/95 [00:38<00:25,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9563, LAS: 0.9161, UEM: 0.6263, LEM: 0.3843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3565, partial_loss/deprel_loss: 0.4152, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6086, loss: 0.6477, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||:  63%|######3   | 60/95 [00:40<00:23,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9564, LAS: 0.9160, UEM: 0.6273, LEM: 0.3867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4026, partial_loss/deprel_loss: 0.4820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6713, loss: 0.6483, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||:  66%|######6   | 63/95 [00:42<00:22,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9559, LAS: 0.9156, UEM: 0.6322, LEM: 0.3938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1012, partial_loss/deprel_loss: 0.2647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4372, loss: 0.6501, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||:  69%|######9   | 66/95 [00:44<00:19,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9554, LAS: 0.9151, UEM: 0.6282, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5122, partial_loss/deprel_loss: 0.4783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6903, loss: 0.6536, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||:  73%|#######2  | 69/95 [00:46<00:17,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9712, UAS: 0.9564, LAS: 0.9164, UEM: 0.6498, LEM: 0.4189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0443, partial_loss/deprel_loss: 0.1197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3098, loss: 0.6467, batch_reg_loss: 0.2052, reg_loss: 0.2053 ||:  76%|#######5  | 72/95 [00:48<00:16,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9566, LAS: 0.9165, UEM: 0.6545, LEM: 0.4220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1457, partial_loss/deprel_loss: 0.3205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4907, loss: 0.6454, batch_reg_loss: 0.2051, reg_loss: 0.2053 ||:  79%|#######8  | 75/95 [00:51<00:14,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9563, LAS: 0.9163, UEM: 0.6471, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2892, partial_loss/deprel_loss: 0.4277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6051, loss: 0.6474, batch_reg_loss: 0.2051, reg_loss: 0.2053 ||:  84%|########4 | 80/95 [00:53<00:09,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9565, LAS: 0.9167, UEM: 0.6459, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5243, loss: 0.6453, batch_reg_loss: 0.2051, reg_loss: 0.2053 ||:  89%|########9 | 85/95 [00:55<00:05,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8357, UAS: 0.9556, LAS: 0.9156, UEM: 0.6391, LEM: 0.4031, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5147, partial_loss/deprel_loss: 0.8003, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1483, loss: 0.6527, batch_reg_loss: 0.2051, reg_loss: 0.2053 ||:  96%|#########5| 91/95 [00:58<00:02,  1.85it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9550, LAS: 0.9149, UEM: 0.6400, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1389, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4416, loss: 0.6561, batch_reg_loss: 0.2050, reg_loss: 0.2053 ||: 100%|##########| 95/95 [01:01<00:00,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9550, LAS: 0.9149, UEM: 0.6400, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1389, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4416, loss: 0.6561, batch_reg_loss: 0.2050, reg_loss: 0.2053 ||: 100%|##########| 95/95 [01:01<00:00,  1.56it/s]\n",
+      "2023-04-07 01:01:48,450 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.205  |       N/A\n",
+      "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - UEM                      |     0.640  |       N/A\n",
+      "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - LEM                      |     0.406  |       N/A\n",
+      "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - EM                       |     0.938  |       N/A\n",
+      "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.139  |       N/A\n",
+      "2023-04-07 01:01:48,451 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |       N/A\n",
+      "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.261  |       N/A\n",
+      "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - loss                     |     0.656  |       N/A\n",
+      "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - LAS                      |     0.915  |       N/A\n",
+      "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:01:48,452 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:01:48,453 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:01:48,453 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:01:48,453 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:01:48,459 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:01:53,134 - INFO - combo.training.trainer - Epoch duration: 0:01:08.655513\n",
+      "2023-04-07 01:01:53,135 - INFO - combo.training.trainer - Estimated training time remaining: 5:19:57\n",
+      "2023-04-07 01:01:53,135 - INFO - allennlp.training.trainer - Epoch 117/399\n",
+      "2023-04-07 01:01:53,135 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:01:53,136 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:01:53,144 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9657, LAS: 0.9271, UEM: 0.7289, LEM: 0.5060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3055, partial_loss/deprel_loss: 0.4084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5929, loss: 0.5641, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||:   3%|3         | 3/95 [00:02<01:09,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9583, LAS: 0.9174, UEM: 0.6494, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6166, partial_loss/deprel_loss: 0.6155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8207, loss: 0.6446, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||:   6%|6         | 6/95 [00:04<01:07,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9613, LAS: 0.9211, UEM: 0.6669, LEM: 0.4219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 0.3347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5055, loss: 0.6202, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||:   9%|9         | 9/95 [00:06<01:03,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9620, LAS: 0.9220, UEM: 0.7170, LEM: 0.4787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1334, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4405, loss: 0.6061, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||:  14%|#3        | 13/95 [00:09<00:59,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9627, LAS: 0.9226, UEM: 0.7430, LEM: 0.5152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2285, partial_loss/deprel_loss: 0.3888, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5617, loss: 0.6003, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||:  17%|#6        | 16/95 [00:11<01:00,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9614, LAS: 0.9207, UEM: 0.7180, LEM: 0.4855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4569, partial_loss/deprel_loss: 0.5699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7523, loss: 0.6153, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||:  20%|##        | 19/95 [00:14<00:56,  1.34it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9606, LAS: 0.9204, UEM: 0.7169, LEM: 0.4907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5126, partial_loss/deprel_loss: 0.4923, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7013, loss: 0.6176, batch_reg_loss: 0.2050, reg_loss: 0.2050 ||:  23%|##3       | 22/95 [00:16<00:55,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9598, LAS: 0.9194, UEM: 0.7115, LEM: 0.4808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9651, partial_loss/deprel_loss: 0.6207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8945, loss: 0.6246, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||:  26%|##6       | 25/95 [00:18<00:52,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9586, LAS: 0.9184, UEM: 0.6856, LEM: 0.4549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4719, partial_loss/deprel_loss: 0.5116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7086, loss: 0.6347, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||:  31%|###       | 29/95 [00:21<00:47,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9652, UAS: 0.9597, LAS: 0.9202, UEM: 0.7099, LEM: 0.4931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0503, partial_loss/deprel_loss: 0.1543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3384, loss: 0.6270, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||:  34%|###3      | 32/95 [00:23<00:46,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9611, LAS: 0.9215, UEM: 0.7257, LEM: 0.5059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0998, partial_loss/deprel_loss: 0.2700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4409, loss: 0.6144, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||:  37%|###6      | 35/95 [00:26<00:45,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9609, LAS: 0.9211, UEM: 0.7160, LEM: 0.4924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2467, partial_loss/deprel_loss: 0.3785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5570, loss: 0.6155, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||:  40%|####      | 38/95 [00:28<00:42,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9587, LAS: 0.9188, UEM: 0.6991, LEM: 0.4793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5246, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7148, loss: 0.6316, batch_reg_loss: 0.2049, reg_loss: 0.2050 ||:  43%|####3     | 41/95 [00:30<00:38,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9591, LAS: 0.9193, UEM: 0.6970, LEM: 0.4749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2204, partial_loss/deprel_loss: 0.2553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4532, loss: 0.6274, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||:  46%|####6     | 44/95 [00:32<00:37,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9577, LAS: 0.9178, UEM: 0.6826, LEM: 0.4629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6035, partial_loss/deprel_loss: 0.5471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7632, loss: 0.6391, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||:  49%|####9     | 47/95 [00:34<00:35,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9578, LAS: 0.9179, UEM: 0.6828, LEM: 0.4613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2021, partial_loss/deprel_loss: 0.3638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5363, loss: 0.6393, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||:  53%|#####2    | 50/95 [00:36<00:32,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9569, LAS: 0.9169, UEM: 0.6781, LEM: 0.4556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2868, partial_loss/deprel_loss: 0.4395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.6455, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||:  56%|#####5    | 53/95 [00:39<00:31,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9556, LAS: 0.9155, UEM: 0.6716, LEM: 0.4519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0218, partial_loss/deprel_loss: 0.7471, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0068, loss: 0.6539, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||:  60%|######    | 57/95 [00:41<00:26,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9559, LAS: 0.9157, UEM: 0.6668, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4642, partial_loss/deprel_loss: 0.4842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6850, loss: 0.6526, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||:  64%|######4   | 61/95 [00:43<00:22,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9561, LAS: 0.9162, UEM: 0.6638, LEM: 0.4372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4905, partial_loss/deprel_loss: 0.4883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6935, loss: 0.6513, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||:  68%|######8   | 65/95 [00:46<00:19,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8883, UAS: 0.9557, LAS: 0.9158, UEM: 0.6566, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7983, partial_loss/deprel_loss: 0.5908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8371, loss: 0.6525, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||:  73%|#######2  | 69/95 [00:48<00:16,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9296, UAS: 0.9558, LAS: 0.9159, UEM: 0.6555, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2320, partial_loss/deprel_loss: 0.4106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5796, loss: 0.6534, batch_reg_loss: 0.2048, reg_loss: 0.2049 ||:  77%|#######6  | 73/95 [00:52<00:15,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9562, LAS: 0.9163, UEM: 0.6571, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1723, partial_loss/deprel_loss: 0.2720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4568, loss: 0.6500, batch_reg_loss: 0.2047, reg_loss: 0.2049 ||:  80%|########  | 76/95 [00:54<00:13,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9569, LAS: 0.9168, UEM: 0.6612, LEM: 0.4284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2000, partial_loss/deprel_loss: 0.3607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5333, loss: 0.6461, batch_reg_loss: 0.2047, reg_loss: 0.2049 ||:  83%|########3 | 79/95 [00:56<00:11,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9569, LAS: 0.9167, UEM: 0.6574, LEM: 0.4224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2967, partial_loss/deprel_loss: 0.4476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.6471, batch_reg_loss: 0.2047, reg_loss: 0.2049 ||:  86%|########6 | 82/95 [00:59<00:09,  1.37it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9563, LAS: 0.9161, UEM: 0.6521, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4103, partial_loss/deprel_loss: 0.4323, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6326, loss: 0.6524, batch_reg_loss: 0.2047, reg_loss: 0.2049 ||:  89%|########9 | 85/95 [01:01<00:07,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9564, LAS: 0.9163, UEM: 0.6528, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3299, partial_loss/deprel_loss: 0.3959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.6503, batch_reg_loss: 0.2047, reg_loss: 0.2049 ||:  94%|#########3| 89/95 [01:03<00:03,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9563, LAS: 0.9160, UEM: 0.6453, LEM: 0.4094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3812, partial_loss/deprel_loss: 0.4746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6606, loss: 0.6513, batch_reg_loss: 0.2047, reg_loss: 0.2048 ||:  99%|#########8| 94/95 [01:05<00:00,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9564, LAS: 0.9161, UEM: 0.6459, LEM: 0.4091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2517, partial_loss/deprel_loss: 0.3691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5503, loss: 0.6502, batch_reg_loss: 0.2047, reg_loss: 0.2048 ||: 100%|##########| 95/95 [01:05<00:00,  1.45it/s]\n",
+      "2023-04-07 01:03:01,644 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.205  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - UEM                      |     0.646  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - LEM                      |     0.409  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - EM                       |     0.921  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.252  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - UAS                      |     0.956  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.369  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - loss                     |     0.650  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - LAS                      |     0.916  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:03:01,645 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:03:01,646 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:03:01,646 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:03:01,646 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:03:01,646 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:03:01,652 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:03:05,803 - INFO - combo.training.trainer - Epoch duration: 0:01:12.667929\n",
+      "2023-04-07 01:03:05,803 - INFO - combo.training.trainer - Estimated training time remaining: 5:19:01\n",
+      "2023-04-07 01:03:05,803 - INFO - allennlp.training.trainer - Epoch 118/399\n",
+      "2023-04-07 01:03:05,807 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:03:05,808 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:03:05,814 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9398, LAS: 0.8988, UEM: 0.3985, LEM: 0.2055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7798, partial_loss/deprel_loss: 0.6197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8564, loss: 0.7712, batch_reg_loss: 0.2046, reg_loss: 0.2047 ||:   4%|4         | 4/95 [00:02<00:54,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9468, LAS: 0.9063, UEM: 0.5245, LEM: 0.2853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1564, partial_loss/deprel_loss: 0.3276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4980, loss: 0.7248, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||:   8%|8         | 8/95 [00:05<00:54,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9524, LAS: 0.9122, UEM: 0.5617, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4304, partial_loss/deprel_loss: 0.4563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6557, loss: 0.6857, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||:  13%|#2        | 12/95 [00:07<00:53,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9504, LAS: 0.9102, UEM: 0.5473, LEM: 0.3003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3414, partial_loss/deprel_loss: 0.4408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6255, loss: 0.6945, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||:  16%|#5        | 15/95 [00:10<00:53,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9525, LAS: 0.9133, UEM: 0.5967, LEM: 0.3721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6889, partial_loss/deprel_loss: 0.5799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8063, loss: 0.6762, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||:  20%|##        | 19/95 [00:12<00:51,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9561, LAS: 0.9172, UEM: 0.6425, LEM: 0.4060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1962, partial_loss/deprel_loss: 0.3841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5511, loss: 0.6493, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||:  24%|##4       | 23/95 [00:15<00:48,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9299, UAS: 0.9572, LAS: 0.9185, UEM: 0.6440, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2619, partial_loss/deprel_loss: 0.3773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5588, loss: 0.6393, batch_reg_loss: 0.2046, reg_loss: 0.2046 ||:  28%|##8       | 27/95 [00:17<00:43,  1.56it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9580, LAS: 0.9192, UEM: 0.6569, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1583, partial_loss/deprel_loss: 0.2687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4512, loss: 0.6296, batch_reg_loss: 0.2045, reg_loss: 0.2046 ||:  33%|###2      | 31/95 [00:20<00:41,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9586, LAS: 0.9196, UEM: 0.6521, LEM: 0.4090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2569, partial_loss/deprel_loss: 0.3917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5693, loss: 0.6243, batch_reg_loss: 0.2045, reg_loss: 0.2046 ||:  37%|###6      | 35/95 [00:23<00:39,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9578, LAS: 0.9188, UEM: 0.6441, LEM: 0.4000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3563, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6328, loss: 0.6311, batch_reg_loss: 0.2045, reg_loss: 0.2046 ||:  40%|####      | 38/95 [00:25<00:37,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9587, LAS: 0.9196, UEM: 0.6489, LEM: 0.4021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2458, partial_loss/deprel_loss: 0.3657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5462, loss: 0.6265, batch_reg_loss: 0.2045, reg_loss: 0.2046 ||:  43%|####3     | 41/95 [00:27<00:36,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9579, LAS: 0.9185, UEM: 0.6353, LEM: 0.3899, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4702, partial_loss/deprel_loss: 0.5163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7116, loss: 0.6337, batch_reg_loss: 0.2045, reg_loss: 0.2046 ||:  46%|####6     | 44/95 [00:29<00:35,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9577, LAS: 0.9182, UEM: 0.6388, LEM: 0.3976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5220, partial_loss/deprel_loss: 0.5771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7706, loss: 0.6353, batch_reg_loss: 0.2044, reg_loss: 0.2046 ||:  49%|####9     | 47/95 [00:31<00:33,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9570, LAS: 0.9176, UEM: 0.6303, LEM: 0.3906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2669, partial_loss/deprel_loss: 0.3453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5341, loss: 0.6409, batch_reg_loss: 0.2044, reg_loss: 0.2046 ||:  53%|#####2    | 50/95 [00:33<00:31,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9577, LAS: 0.9183, UEM: 0.6410, LEM: 0.4001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1441, partial_loss/deprel_loss: 0.2727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4514, loss: 0.6355, batch_reg_loss: 0.2044, reg_loss: 0.2045 ||:  56%|#####5    | 53/95 [00:35<00:29,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9579, LAS: 0.9183, UEM: 0.6397, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2858, partial_loss/deprel_loss: 0.4277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6037, loss: 0.6348, batch_reg_loss: 0.2044, reg_loss: 0.2045 ||:  59%|#####8    | 56/95 [00:38<00:27,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9582, LAS: 0.9185, UEM: 0.6424, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4151, partial_loss/deprel_loss: 0.4470, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6450, loss: 0.6306, batch_reg_loss: 0.2044, reg_loss: 0.2045 ||:  62%|######2   | 59/95 [00:40<00:26,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9582, LAS: 0.9184, UEM: 0.6424, LEM: 0.3980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5443, partial_loss/deprel_loss: 0.5232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7318, loss: 0.6310, batch_reg_loss: 0.2044, reg_loss: 0.2045 ||:  65%|######5   | 62/95 [00:42<00:23,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9578, LAS: 0.9181, UEM: 0.6436, LEM: 0.4004, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5960, loss: 0.6327, batch_reg_loss: 0.2044, reg_loss: 0.2045 ||:  68%|######8   | 65/95 [00:44<00:22,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9586, LAS: 0.9189, UEM: 0.6586, LEM: 0.4157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.3274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5060, loss: 0.6260, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||:  72%|#######1  | 68/95 [00:47<00:20,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9582, LAS: 0.9185, UEM: 0.6553, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7309, partial_loss/deprel_loss: 0.5876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8206, loss: 0.6301, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||:  75%|#######4  | 71/95 [00:49<00:18,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9575, LAS: 0.9177, UEM: 0.6469, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4428, partial_loss/deprel_loss: 0.4354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6412, loss: 0.6368, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||:  78%|#######7  | 74/95 [00:51<00:15,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9564, LAS: 0.9164, UEM: 0.6414, LEM: 0.4021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3437, partial_loss/deprel_loss: 0.3802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5772, loss: 0.6446, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||:  81%|########1 | 77/95 [00:54<00:13,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9566, LAS: 0.9169, UEM: 0.6540, LEM: 0.4228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7177, partial_loss/deprel_loss: 0.5827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8140, loss: 0.6425, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||:  84%|########4 | 80/95 [00:56<00:11,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9564, LAS: 0.9167, UEM: 0.6479, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1983, partial_loss/deprel_loss: 0.3592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5313, loss: 0.6447, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||:  88%|########8 | 84/95 [00:58<00:08,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9568, LAS: 0.9170, UEM: 0.6508, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4443, partial_loss/deprel_loss: 0.4700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6691, loss: 0.6432, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||:  92%|#########1| 87/95 [01:01<00:05,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9559, LAS: 0.9159, UEM: 0.6427, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7055, partial_loss/deprel_loss: 0.6593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8728, loss: 0.6516, batch_reg_loss: 0.2043, reg_loss: 0.2045 ||:  96%|#########5| 91/95 [01:03<00:02,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9562, LAS: 0.9163, UEM: 0.6432, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3102, partial_loss/deprel_loss: 0.4098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5941, loss: 0.6499, batch_reg_loss: 0.2043, reg_loss: 0.2044 ||: 100%|##########| 95/95 [01:05<00:00,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9562, LAS: 0.9163, UEM: 0.6432, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3102, partial_loss/deprel_loss: 0.4098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5941, loss: 0.6499, batch_reg_loss: 0.2043, reg_loss: 0.2044 ||: 100%|##########| 95/95 [01:05<00:00,  1.44it/s]\n",
+      "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.204  |       N/A\n",
+      "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - UEM                      |     0.643  |       N/A\n",
+      "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - LEM                      |     0.409  |       N/A\n",
+      "2023-04-07 01:04:14,730 - INFO - combo.training.tensorboard_writer - EM                       |     0.931  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.310  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - UAS                      |     0.956  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.410  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - loss                     |     0.650  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - LAS                      |     0.916  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:04:14,731 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:04:14,736 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:04:19,866 - INFO - combo.training.trainer - Epoch duration: 0:01:14.062399\n",
+      "2023-04-07 01:04:19,866 - INFO - combo.training.trainer - Estimated training time remaining: 5:18:08\n",
+      "2023-04-07 01:04:19,867 - INFO - allennlp.training.trainer - Epoch 119/399\n",
+      "2023-04-07 01:04:19,867 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:04:19,868 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:04:19,877 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9680, LAS: 0.9297, UEM: 0.7144, LEM: 0.4521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1628, partial_loss/deprel_loss: 0.3151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4889, loss: 0.5497, batch_reg_loss: 0.2042, reg_loss: 0.2042 ||:   5%|5         | 5/95 [00:02<00:37,  2.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8973, UAS: 0.9658, LAS: 0.9279, UEM: 0.7102, LEM: 0.4669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6621, partial_loss/deprel_loss: 0.5502, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7768, loss: 0.5636, batch_reg_loss: 0.2042, reg_loss: 0.2042 ||:  11%|#         | 10/95 [00:04<00:37,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9595, LAS: 0.9203, UEM: 0.6506, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5168, partial_loss/deprel_loss: 0.5144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7191, loss: 0.6185, batch_reg_loss: 0.2042, reg_loss: 0.2042 ||:  15%|#4        | 14/95 [00:07<00:40,  2.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9612, LAS: 0.9225, UEM: 0.6805, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1406, partial_loss/deprel_loss: 0.2792, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4557, loss: 0.6006, batch_reg_loss: 0.2042, reg_loss: 0.2042 ||:  18%|#7        | 17/95 [00:09<00:47,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9611, LAS: 0.9216, UEM: 0.6632, LEM: 0.4201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6356, partial_loss/deprel_loss: 0.5895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8029, loss: 0.6072, batch_reg_loss: 0.2042, reg_loss: 0.2042 ||:  22%|##2       | 21/95 [00:12<00:46,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9596, LAS: 0.9201, UEM: 0.6629, LEM: 0.4254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8306, partial_loss/deprel_loss: 0.5451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8064, loss: 0.6138, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||:  25%|##5       | 24/95 [00:14<00:45,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9589, LAS: 0.9196, UEM: 0.6462, LEM: 0.4091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2599, partial_loss/deprel_loss: 0.3826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5622, loss: 0.6170, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||:  29%|##9       | 28/95 [00:17<00:44,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9607, LAS: 0.9210, UEM: 0.6755, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1929, partial_loss/deprel_loss: 0.3773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5445, loss: 0.6047, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||:  33%|###2      | 31/95 [00:19<00:45,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9595, LAS: 0.9196, UEM: 0.6593, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2287, partial_loss/deprel_loss: 0.3646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5415, loss: 0.6169, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||:  37%|###6      | 35/95 [00:22<00:40,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9577, LAS: 0.9178, UEM: 0.6494, LEM: 0.4099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5927, partial_loss/deprel_loss: 0.5126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7327, loss: 0.6291, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||:  40%|####      | 38/95 [00:24<00:39,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8500, UAS: 0.9555, LAS: 0.9152, UEM: 0.6316, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4118, partial_loss/deprel_loss: 0.7559, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0912, loss: 0.6490, batch_reg_loss: 0.2041, reg_loss: 0.2042 ||:  44%|####4     | 42/95 [00:26<00:35,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9555, LAS: 0.9152, UEM: 0.6242, LEM: 0.3862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4271, partial_loss/deprel_loss: 0.4676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6636, loss: 0.6491, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||:  48%|####8     | 46/95 [00:29<00:31,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9555, LAS: 0.9153, UEM: 0.6226, LEM: 0.3851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1712, partial_loss/deprel_loss: 0.2492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4376, loss: 0.6464, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||:  53%|#####2    | 50/95 [00:31<00:28,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9567, LAS: 0.9167, UEM: 0.6471, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1921, partial_loss/deprel_loss: 0.2977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4806, loss: 0.6348, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||:  57%|#####6    | 54/95 [00:35<00:29,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9551, LAS: 0.9151, UEM: 0.6367, LEM: 0.4053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3423, partial_loss/deprel_loss: 0.7008, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0331, loss: 0.6454, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||:  60%|######    | 57/95 [00:37<00:27,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9559, LAS: 0.9158, UEM: 0.6492, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2480, partial_loss/deprel_loss: 0.3437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5286, loss: 0.6408, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||:  63%|######3   | 60/95 [00:39<00:24,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9561, LAS: 0.9162, UEM: 0.6626, LEM: 0.4415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8539, partial_loss/deprel_loss: 0.6229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8731, loss: 0.6397, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||:  66%|######6   | 63/95 [00:41<00:23,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9565, LAS: 0.9165, UEM: 0.6619, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2363, partial_loss/deprel_loss: 0.3619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5407, loss: 0.6368, batch_reg_loss: 0.2040, reg_loss: 0.2041 ||:  71%|#######   | 67/95 [00:44<00:20,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9563, LAS: 0.9162, UEM: 0.6544, LEM: 0.4272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3891, partial_loss/deprel_loss: 0.4232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6203, loss: 0.6394, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||:  75%|#######4  | 71/95 [00:47<00:16,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9478, UAS: 0.9556, LAS: 0.9155, UEM: 0.6502, LEM: 0.4245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1658, partial_loss/deprel_loss: 0.2808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4618, loss: 0.6453, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||:  79%|#######8  | 75/95 [00:49<00:13,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9363, UAS: 0.9553, LAS: 0.9152, UEM: 0.6450, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1619, partial_loss/deprel_loss: 0.3237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4953, loss: 0.6480, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||:  83%|########3 | 79/95 [00:52<00:10,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9551, LAS: 0.9150, UEM: 0.6381, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7115, partial_loss/deprel_loss: 0.6701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8823, loss: 0.6514, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||:  87%|########7 | 83/95 [00:55<00:08,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9554, LAS: 0.9153, UEM: 0.6370, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4684, partial_loss/deprel_loss: 0.5085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7044, loss: 0.6494, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||:  91%|######### | 86/95 [00:57<00:06,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9557, LAS: 0.9156, UEM: 0.6374, LEM: 0.4068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2779, partial_loss/deprel_loss: 0.4226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5975, loss: 0.6469, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||:  94%|#########3| 89/95 [00:59<00:04,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9557, LAS: 0.9154, UEM: 0.6349, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7387, partial_loss/deprel_loss: 0.6025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8336, loss: 0.6483, batch_reg_loss: 0.2039, reg_loss: 0.2041 ||:  97%|#########6| 92/95 [01:01<00:02,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9558, LAS: 0.9156, UEM: 0.6386, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2235, partial_loss/deprel_loss: 0.3477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.6477, batch_reg_loss: 0.2039, reg_loss: 0.2040 ||: 100%|##########| 95/95 [01:04<00:00,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9558, LAS: 0.9156, UEM: 0.6386, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2235, partial_loss/deprel_loss: 0.3477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.6477, batch_reg_loss: 0.2039, reg_loss: 0.2040 ||: 100%|##########| 95/95 [01:04<00:00,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.204  |       N/A\n",
+      "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:05:27,550 - INFO - combo.training.tensorboard_writer - UEM                      |     0.639  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - LEM                      |     0.407  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - EM                       |     0.936  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.224  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - UAS                      |     0.956  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.348  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - loss                     |     0.648  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - LAS                      |     0.916  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:05:27,551 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:05:27,556 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:05:32,555 - INFO - combo.training.trainer - Epoch duration: 0:01:12.688653\n",
+      "2023-04-07 01:05:32,556 - INFO - combo.training.trainer - Estimated training time remaining: 5:17:11\n",
+      "2023-04-07 01:05:32,556 - INFO - allennlp.training.trainer - Epoch 120/399\n",
+      "2023-04-07 01:05:32,556 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:05:32,557 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:05:32,567 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9607, LAS: 0.9192, UEM: 0.6978, LEM: 0.4385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8741, partial_loss/deprel_loss: 0.6850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9267, loss: 0.6465, batch_reg_loss: 0.2039, reg_loss: 0.2039 ||:   4%|4         | 4/95 [00:02<00:57,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9641, LAS: 0.9246, UEM: 0.7115, LEM: 0.4575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4423, partial_loss/deprel_loss: 0.4296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6360, loss: 0.5976, batch_reg_loss: 0.2038, reg_loss: 0.2039 ||:   7%|7         | 7/95 [00:04<00:58,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9647, LAS: 0.9252, UEM: 0.7035, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4366, partial_loss/deprel_loss: 0.4334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6379, loss: 0.5810, batch_reg_loss: 0.2038, reg_loss: 0.2038 ||:  13%|#2        | 12/95 [00:06<00:49,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9593, LAS: 0.9201, UEM: 0.6765, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1827, partial_loss/deprel_loss: 0.3296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5040, loss: 0.6190, batch_reg_loss: 0.2038, reg_loss: 0.2038 ||:  17%|#6        | 16/95 [00:09<00:45,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9571, LAS: 0.9183, UEM: 0.6765, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0005, partial_loss/deprel_loss: 0.6994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9634, loss: 0.6334, batch_reg_loss: 0.2038, reg_loss: 0.2038 ||:  22%|##2       | 21/95 [00:11<00:40,  1.84it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9577, LAS: 0.9187, UEM: 0.6619, LEM: 0.4209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4076, partial_loss/deprel_loss: 0.5277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7075, loss: 0.6312, batch_reg_loss: 0.2038, reg_loss: 0.2038 ||:  26%|##6       | 25/95 [00:13<00:38,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9590, LAS: 0.9198, UEM: 0.6632, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2917, partial_loss/deprel_loss: 0.4139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.6214, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||:  31%|###       | 29/95 [00:16<00:37,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9589, LAS: 0.9198, UEM: 0.6604, LEM: 0.4150, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6513, partial_loss/deprel_loss: 0.5765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7952, loss: 0.6228, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||:  35%|###4      | 33/95 [00:19<00:38,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9584, LAS: 0.9192, UEM: 0.6470, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3922, partial_loss/deprel_loss: 0.4201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6182, loss: 0.6277, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||:  39%|###8      | 37/95 [00:21<00:35,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9585, LAS: 0.9190, UEM: 0.6380, LEM: 0.3900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3262, partial_loss/deprel_loss: 0.4707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6455, loss: 0.6304, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||:  43%|####3     | 41/95 [00:24<00:35,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9584, LAS: 0.9187, UEM: 0.6337, LEM: 0.3822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2109, partial_loss/deprel_loss: 0.4067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5713, loss: 0.6353, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||:  47%|####7     | 45/95 [00:26<00:32,  1.56it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9592, LAS: 0.9196, UEM: 0.6479, LEM: 0.3988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0840, partial_loss/deprel_loss: 0.2389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4116, loss: 0.6285, batch_reg_loss: 0.2037, reg_loss: 0.2038 ||:  52%|#####1    | 49/95 [00:30<00:32,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9584, LAS: 0.9189, UEM: 0.6377, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6546, partial_loss/deprel_loss: 0.4722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7123, loss: 0.6337, batch_reg_loss: 0.2036, reg_loss: 0.2038 ||:  56%|#####5    | 53/95 [00:32<00:28,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9571, LAS: 0.9176, UEM: 0.6324, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2468, partial_loss/deprel_loss: 0.3608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5416, loss: 0.6433, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||:  59%|#####8    | 56/95 [00:34<00:26,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9569, LAS: 0.9173, UEM: 0.6276, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6429, partial_loss/deprel_loss: 0.6347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8400, loss: 0.6461, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||:  62%|######2   | 59/95 [00:37<00:24,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9704, UAS: 0.9578, LAS: 0.9186, UEM: 0.6535, LEM: 0.4186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0350, partial_loss/deprel_loss: 0.1191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3059, loss: 0.6387, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||:  65%|######5   | 62/95 [00:39<00:23,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9576, LAS: 0.9183, UEM: 0.6445, LEM: 0.4095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5544, partial_loss/deprel_loss: 0.5059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7192, loss: 0.6401, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||:  69%|######9   | 66/95 [00:41<00:20,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9575, LAS: 0.9182, UEM: 0.6455, LEM: 0.4114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6521, partial_loss/deprel_loss: 0.6149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8259, loss: 0.6402, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||:  73%|#######2  | 69/95 [00:44<00:18,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9570, LAS: 0.9177, UEM: 0.6504, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1028, partial_loss/deprel_loss: 0.1930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3785, loss: 0.6430, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||:  76%|#######5  | 72/95 [00:46<00:16,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9560, LAS: 0.9166, UEM: 0.6452, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2186, partial_loss/deprel_loss: 0.3310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5121, loss: 0.6504, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||:  80%|########  | 76/95 [00:48<00:12,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9562, LAS: 0.9168, UEM: 0.6437, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4998, partial_loss/deprel_loss: 0.5030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7059, loss: 0.6489, batch_reg_loss: 0.2036, reg_loss: 0.2037 ||:  84%|########4 | 80/95 [00:51<00:09,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9564, LAS: 0.9170, UEM: 0.6455, LEM: 0.4172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3524, partial_loss/deprel_loss: 0.3942, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5894, loss: 0.6464, batch_reg_loss: 0.2035, reg_loss: 0.2037 ||:  88%|########8 | 84/95 [00:53<00:07,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9565, LAS: 0.9170, UEM: 0.6404, LEM: 0.4098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3748, partial_loss/deprel_loss: 0.4616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6478, loss: 0.6465, batch_reg_loss: 0.2035, reg_loss: 0.2037 ||:  93%|#########2| 88/95 [00:56<00:04,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9563, LAS: 0.9166, UEM: 0.6429, LEM: 0.4095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2583, partial_loss/deprel_loss: 0.3898, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5670, loss: 0.6479, batch_reg_loss: 0.2035, reg_loss: 0.2037 ||:  97%|#########6| 92/95 [00:59<00:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9562, LAS: 0.9165, UEM: 0.6439, LEM: 0.4110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6464, partial_loss/deprel_loss: 0.5771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7945, loss: 0.6475, batch_reg_loss: 0.2035, reg_loss: 0.2037 ||: 100%|##########| 95/95 [01:01<00:00,  1.55it/s]\n",
+      "2023-04-07 01:06:36,825 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9550, LAS: 0.9072, UEM: 0.7556, LEM: 0.5511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1711, partial_loss/deprel_loss: 23.5112, partial_loss/cycle_loss: 0.0000, batch_loss: 19.0432, loss: 11.8022, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:07,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9537, LAS: 0.9059, UEM: 0.7448, LEM: 0.5037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1712, partial_loss/deprel_loss: 7.0066, partial_loss/cycle_loss: 0.0000, batch_loss: 5.6395, loss: 11.6950, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  55%|#####4    | 6/11 [00:05<00:04,  1.09it/s]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8733, UAS: 0.9520, LAS: 0.9009, UEM: 0.6977, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0938, partial_loss/deprel_loss: 20.2974, partial_loss/cycle_loss: 0.0000, batch_loss: 16.4566, loss: 11.4879, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  82%|########1 | 9/11 [00:07<00:01,  1.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9515, LAS: 0.9014, UEM: 0.6811, LEM: 0.4059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0456, partial_loss/deprel_loss: 12.9410, partial_loss/cycle_loss: 0.0000, batch_loss: 10.5620, loss: 11.0767, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00,  1.16it/s]\n",
+      "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.204  |     0.000\n",
+      "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - UEM                      |     0.644  |     0.681\n",
+      "2023-04-07 01:06:46,328 - INFO - combo.training.tensorboard_writer - LEM                      |     0.411  |     0.406\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - EM                       |     0.906  |     0.879\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.646  |     1.046\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - UAS                      |     0.956  |     0.952\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.577  |    12.941\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - loss                     |     0.648  |    11.077\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - LAS                      |     0.917  |     0.901\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:06:46,329 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:06:46,336 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:06:52,753 - INFO - combo.training.trainer - Epoch duration: 0:01:20.197188\n",
+      "2023-04-07 01:06:52,754 - INFO - combo.training.trainer - Estimated training time remaining: 5:16:31\n",
+      "2023-04-07 01:06:52,754 - INFO - allennlp.training.trainer - Epoch 121/399\n",
+      "2023-04-07 01:06:52,754 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:06:52,755 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:06:52,764 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9657, LAS: 0.9285, UEM: 0.7889, LEM: 0.6036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4974, partial_loss/deprel_loss: 0.5193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7184, loss: 0.5442, batch_reg_loss: 0.2035, reg_loss: 0.2035 ||:   3%|3         | 3/95 [00:02<01:03,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9615, LAS: 0.9228, UEM: 0.7172, LEM: 0.5127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1285, partial_loss/deprel_loss: 0.3225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4871, loss: 0.5970, batch_reg_loss: 0.2035, reg_loss: 0.2035 ||:   7%|7         | 7/95 [00:04<00:57,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9591, LAS: 0.9207, UEM: 0.6577, LEM: 0.4435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2278, partial_loss/deprel_loss: 0.2828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4752, loss: 0.6176, batch_reg_loss: 0.2034, reg_loss: 0.2035 ||:  13%|#2        | 12/95 [00:06<00:50,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9604, LAS: 0.9221, UEM: 0.6761, LEM: 0.4535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3532, partial_loss/deprel_loss: 0.4561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6389, loss: 0.6078, batch_reg_loss: 0.2034, reg_loss: 0.2035 ||:  17%|#6        | 16/95 [00:09<00:48,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9605, LAS: 0.9217, UEM: 0.6605, LEM: 0.4306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4820, partial_loss/deprel_loss: 0.4622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6695, loss: 0.6117, batch_reg_loss: 0.2034, reg_loss: 0.2034 ||:  21%|##1       | 20/95 [00:11<00:45,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9606, LAS: 0.9215, UEM: 0.6706, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1739, partial_loss/deprel_loss: 0.3131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.6099, batch_reg_loss: 0.2034, reg_loss: 0.2034 ||:  25%|##5       | 24/95 [00:14<00:43,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9551, LAS: 0.9160, UEM: 0.6458, LEM: 0.4153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0604, partial_loss/deprel_loss: 0.6867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9648, loss: 0.6471, batch_reg_loss: 0.2034, reg_loss: 0.2034 ||:  28%|##8       | 27/95 [00:16<00:43,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9537, LAS: 0.9144, UEM: 0.6245, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0133, partial_loss/deprel_loss: 0.7242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9854, loss: 0.6621, batch_reg_loss: 0.2034, reg_loss: 0.2034 ||:  33%|###2      | 31/95 [00:18<00:39,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9545, LAS: 0.9156, UEM: 0.6416, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2303, partial_loss/deprel_loss: 0.3377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5196, loss: 0.6512, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||:  37%|###6      | 35/95 [00:20<00:36,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9555, LAS: 0.9166, UEM: 0.6503, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4090, partial_loss/deprel_loss: 0.4479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6435, loss: 0.6435, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||:  41%|####1     | 39/95 [00:22<00:32,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9564, LAS: 0.9176, UEM: 0.6608, LEM: 0.4324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5306, partial_loss/deprel_loss: 0.5478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7476, loss: 0.6387, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||:  46%|####6     | 44/95 [00:25<00:27,  1.84it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9563, LAS: 0.9174, UEM: 0.6605, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4828, partial_loss/deprel_loss: 0.5112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7088, loss: 0.6393, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||:  51%|#####     | 48/95 [00:28<00:27,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9548, LAS: 0.9160, UEM: 0.6715, LEM: 0.4605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0341, partial_loss/deprel_loss: 0.1105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2985, loss: 0.6491, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||:  55%|#####4    | 52/95 [00:31<00:27,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9543, LAS: 0.9154, UEM: 0.6605, LEM: 0.4493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7332, partial_loss/deprel_loss: 0.5672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8036, loss: 0.6531, batch_reg_loss: 0.2033, reg_loss: 0.2034 ||:  59%|#####8    | 56/95 [00:34<00:26,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9547, LAS: 0.9155, UEM: 0.6511, LEM: 0.4367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4452, partial_loss/deprel_loss: 0.5057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6969, loss: 0.6522, batch_reg_loss: 0.2032, reg_loss: 0.2034 ||:  63%|######3   | 60/95 [00:36<00:23,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9260, UAS: 0.9550, LAS: 0.9158, UEM: 0.6472, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2990, partial_loss/deprel_loss: 0.3634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.6503, batch_reg_loss: 0.2032, reg_loss: 0.2034 ||:  66%|######6   | 63/95 [00:39<00:22,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9551, LAS: 0.9158, UEM: 0.6459, LEM: 0.4267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4032, partial_loss/deprel_loss: 0.5283, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7065, loss: 0.6498, batch_reg_loss: 0.2032, reg_loss: 0.2034 ||:  69%|######9   | 66/95 [00:41<00:20,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9557, LAS: 0.9162, UEM: 0.6485, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2272, partial_loss/deprel_loss: 0.3453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5249, loss: 0.6453, batch_reg_loss: 0.2032, reg_loss: 0.2033 ||:  73%|#######2  | 69/95 [00:43<00:17,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9565, LAS: 0.9170, UEM: 0.6550, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2400, partial_loss/deprel_loss: 0.3800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5552, loss: 0.6408, batch_reg_loss: 0.2032, reg_loss: 0.2033 ||:  76%|#######5  | 72/95 [00:45<00:16,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9564, LAS: 0.9168, UEM: 0.6488, LEM: 0.4210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3583, partial_loss/deprel_loss: 0.4040, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5980, loss: 0.6432, batch_reg_loss: 0.2032, reg_loss: 0.2033 ||:  80%|########  | 76/95 [00:47<00:12,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9573, LAS: 0.9176, UEM: 0.6578, LEM: 0.4263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1597, partial_loss/deprel_loss: 0.3499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5150, loss: 0.6371, batch_reg_loss: 0.2032, reg_loss: 0.2033 ||:  84%|########4 | 80/95 [00:51<00:10,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9572, LAS: 0.9176, UEM: 0.6526, LEM: 0.4205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8893, partial_loss/deprel_loss: 0.6400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8930, loss: 0.6384, batch_reg_loss: 0.2031, reg_loss: 0.2033 ||:  88%|########8 | 84/95 [00:53<00:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9575, LAS: 0.9180, UEM: 0.6517, LEM: 0.4188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2876, partial_loss/deprel_loss: 0.4038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5837, loss: 0.6361, batch_reg_loss: 0.2031, reg_loss: 0.2033 ||:  93%|#########2| 88/95 [00:56<00:04,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9578, LAS: 0.9182, UEM: 0.6517, LEM: 0.4170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4092, partial_loss/deprel_loss: 0.4666, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6582, loss: 0.6346, batch_reg_loss: 0.2031, reg_loss: 0.2033 ||:  96%|#########5| 91/95 [00:58<00:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9572, LAS: 0.9176, UEM: 0.6478, LEM: 0.4128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3699, partial_loss/deprel_loss: 0.4647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6488, loss: 0.6397, batch_reg_loss: 0.2031, reg_loss: 0.2033 ||:  99%|#########8| 94/95 [01:00<00:00,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9036, UAS: 0.9570, LAS: 0.9174, UEM: 0.6454, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7064, partial_loss/deprel_loss: 0.5231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7628, loss: 0.6410, batch_reg_loss: 0.2031, reg_loss: 0.2033 ||: 100%|##########| 95/95 [01:00<00:00,  1.56it/s]\n",
+      "2023-04-07 01:07:56,773 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.203  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - UEM                      |     0.645  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - LEM                      |     0.411  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - EM                       |     0.904  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.706  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - UAS                      |     0.957  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:07:56,774 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.523  |       N/A\n",
+      "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - loss                     |     0.641  |       N/A\n",
+      "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - LAS                      |     0.917  |       N/A\n",
+      "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:07:56,775 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:07:56,780 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:08:01,559 - INFO - combo.training.trainer - Epoch duration: 0:01:08.804784\n",
+      "2023-04-07 01:08:01,559 - INFO - combo.training.trainer - Estimated training time remaining: 5:15:25\n",
+      "2023-04-07 01:08:01,559 - INFO - allennlp.training.trainer - Epoch 122/399\n",
+      "2023-04-07 01:08:01,559 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:08:01,560 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:08:01,568 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9522, LAS: 0.9092, UEM: 0.6411, LEM: 0.3540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2410, partial_loss/deprel_loss: 0.3748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5511, loss: 0.6883, batch_reg_loss: 0.2031, reg_loss: 0.2031 ||:   4%|4         | 4/95 [00:02<01:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9574, LAS: 0.9141, UEM: 0.6795, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6053, partial_loss/deprel_loss: 0.5899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7961, loss: 0.6567, batch_reg_loss: 0.2031, reg_loss: 0.2031 ||:   7%|7         | 7/95 [00:04<01:02,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9607, LAS: 0.9189, UEM: 0.6862, LEM: 0.4099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1805, partial_loss/deprel_loss: 0.3899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5511, loss: 0.6337, batch_reg_loss: 0.2030, reg_loss: 0.2031 ||:  12%|#1        | 11/95 [00:07<00:58,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9631, LAS: 0.9222, UEM: 0.7088, LEM: 0.4397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2324, partial_loss/deprel_loss: 0.3625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5396, loss: 0.6084, batch_reg_loss: 0.2030, reg_loss: 0.2031 ||:  15%|#4        | 14/95 [00:10<00:59,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9604, LAS: 0.9200, UEM: 0.6754, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8685, partial_loss/deprel_loss: 0.5884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8475, loss: 0.6257, batch_reg_loss: 0.2030, reg_loss: 0.2031 ||:  19%|#8        | 18/95 [00:12<00:55,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8572, UAS: 0.9579, LAS: 0.9176, UEM: 0.6667, LEM: 0.4036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4474, partial_loss/deprel_loss: 0.8004, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1328, loss: 0.6446, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||:  22%|##2       | 21/95 [00:14<00:52,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9560, LAS: 0.9159, UEM: 0.6531, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2114, partial_loss/deprel_loss: 0.6714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9824, loss: 0.6546, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||:  25%|##5       | 24/95 [00:17<00:52,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9556, LAS: 0.9155, UEM: 0.6472, LEM: 0.3905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1760, partial_loss/deprel_loss: 0.3607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5268, loss: 0.6565, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||:  28%|##8       | 27/95 [00:19<00:51,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9556, LAS: 0.9157, UEM: 0.6317, LEM: 0.3773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7273, partial_loss/deprel_loss: 0.5864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8175, loss: 0.6584, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||:  33%|###2      | 31/95 [00:22<00:46,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9570, LAS: 0.9178, UEM: 0.6732, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1928, partial_loss/deprel_loss: 0.2727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4597, loss: 0.6434, batch_reg_loss: 0.2030, reg_loss: 0.2030 ||:  36%|###5      | 34/95 [00:24<00:45,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9577, LAS: 0.9184, UEM: 0.6754, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6310, partial_loss/deprel_loss: 0.5785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7920, loss: 0.6375, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||:  40%|####      | 38/95 [00:27<00:41,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9576, LAS: 0.9185, UEM: 0.6792, LEM: 0.4450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4283, partial_loss/deprel_loss: 0.4232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6271, loss: 0.6361, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||:  43%|####3     | 41/95 [00:29<00:39,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9574, LAS: 0.9182, UEM: 0.6802, LEM: 0.4504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3893, partial_loss/deprel_loss: 0.5060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6856, loss: 0.6373, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||:  48%|####8     | 46/95 [00:31<00:32,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9577, LAS: 0.9183, UEM: 0.6801, LEM: 0.4500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6569, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8026, loss: 0.6332, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||:  54%|#####3    | 51/95 [00:34<00:26,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9563, LAS: 0.9167, UEM: 0.6622, LEM: 0.4331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5892, partial_loss/deprel_loss: 0.5016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7220, loss: 0.6428, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||:  59%|#####8    | 56/95 [00:36<00:21,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9564, LAS: 0.9165, UEM: 0.6609, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1120, partial_loss/deprel_loss: 0.2517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4266, loss: 0.6454, batch_reg_loss: 0.2029, reg_loss: 0.2030 ||:  63%|######3   | 60/95 [00:39<00:19,  1.77it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9566, LAS: 0.9166, UEM: 0.6570, LEM: 0.4238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2082, partial_loss/deprel_loss: 0.3126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4946, loss: 0.6445, batch_reg_loss: 0.2028, reg_loss: 0.2030 ||:  67%|######7   | 64/95 [00:41<00:17,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9565, LAS: 0.9165, UEM: 0.6534, LEM: 0.4198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1969, partial_loss/deprel_loss: 0.3458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5188, loss: 0.6468, batch_reg_loss: 0.2028, reg_loss: 0.2030 ||:  72%|#######1  | 68/95 [00:44<00:16,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9368, UAS: 0.9571, LAS: 0.9168, UEM: 0.6561, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1879, partial_loss/deprel_loss: 0.3157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4929, loss: 0.6437, batch_reg_loss: 0.2028, reg_loss: 0.2029 ||:  76%|#######5  | 72/95 [00:47<00:14,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9571, LAS: 0.9170, UEM: 0.6505, LEM: 0.4114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4361, partial_loss/deprel_loss: 0.4849, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6779, loss: 0.6436, batch_reg_loss: 0.2028, reg_loss: 0.2029 ||:  80%|########  | 76/95 [00:49<00:12,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9567, LAS: 0.9166, UEM: 0.6428, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.3795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5610, loss: 0.6456, batch_reg_loss: 0.2028, reg_loss: 0.2029 ||:  84%|########4 | 80/95 [00:52<00:09,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9566, LAS: 0.9165, UEM: 0.6422, LEM: 0.4044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2938, partial_loss/deprel_loss: 0.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5621, loss: 0.6467, batch_reg_loss: 0.2028, reg_loss: 0.2029 ||:  88%|########8 | 84/95 [00:54<00:07,  1.55it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9566, LAS: 0.9164, UEM: 0.6409, LEM: 0.4035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7118, partial_loss/deprel_loss: 0.6359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8538, loss: 0.6471, batch_reg_loss: 0.2028, reg_loss: 0.2029 ||:  93%|#########2| 88/95 [00:57<00:04,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9569, LAS: 0.9167, UEM: 0.6413, LEM: 0.4018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2269, partial_loss/deprel_loss: 0.3773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5499, loss: 0.6463, batch_reg_loss: 0.2027, reg_loss: 0.2029 ||:  97%|#########6| 92/95 [01:00<00:01,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9575, LAS: 0.9173, UEM: 0.6502, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3807, partial_loss/deprel_loss: 0.4250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6188, loss: 0.6419, batch_reg_loss: 0.2027, reg_loss: 0.2029 ||: 100%|##########| 95/95 [01:02<00:00,  1.53it/s]\n",
+      "2023-04-07 01:09:07,080 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:09:07,080 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.203  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - UEM                      |     0.650  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - LEM                      |     0.412  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - EM                       |     0.924  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.381  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - UAS                      |     0.957  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.425  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - loss                     |     0.642  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - LAS                      |     0.917  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:09:07,081 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:09:07,082 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:09:07,082 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:09:07,086 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:09:11,880 - INFO - combo.training.trainer - Epoch duration: 0:01:10.320997\n",
+      "2023-04-07 01:09:11,881 - INFO - combo.training.trainer - Estimated training time remaining: 5:14:22\n",
+      "2023-04-07 01:09:11,881 - INFO - allennlp.training.trainer - Epoch 123/399\n",
+      "2023-04-07 01:09:11,881 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:09:11,882 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:09:11,892 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9522, LAS: 0.9148, UEM: 0.3620, LEM: 0.1128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4884, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6379, loss: 0.6508, batch_reg_loss: 0.2027, reg_loss: 0.2027 ||:   3%|3         | 3/95 [00:02<01:07,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9526, LAS: 0.9140, UEM: 0.4789, LEM: 0.2115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1629, partial_loss/deprel_loss: 0.3631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5257, loss: 0.6626, batch_reg_loss: 0.2027, reg_loss: 0.2027 ||:   6%|6         | 6/95 [00:04<01:06,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9574, LAS: 0.9187, UEM: 0.5721, LEM: 0.2951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3070, partial_loss/deprel_loss: 0.4475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.6244, batch_reg_loss: 0.2027, reg_loss: 0.2027 ||:   9%|9         | 9/95 [00:06<01:03,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9548, LAS: 0.9155, UEM: 0.5731, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5578, partial_loss/deprel_loss: 0.6007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7948, loss: 0.6512, batch_reg_loss: 0.2027, reg_loss: 0.2027 ||:  13%|#2        | 12/95 [00:09<01:03,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9550, LAS: 0.9159, UEM: 0.5895, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5842, partial_loss/deprel_loss: 0.5232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7381, loss: 0.6500, batch_reg_loss: 0.2027, reg_loss: 0.2027 ||:  16%|#5        | 15/95 [00:11<01:01,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9543, LAS: 0.9144, UEM: 0.5722, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3629, partial_loss/deprel_loss: 0.3955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5917, loss: 0.6535, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||:  19%|#8        | 18/95 [00:13<00:57,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9538, LAS: 0.9140, UEM: 0.5603, LEM: 0.3080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3997, partial_loss/deprel_loss: 0.4252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6227, loss: 0.6544, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||:  23%|##3       | 22/95 [00:15<00:51,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9542, LAS: 0.9148, UEM: 0.5804, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6433, partial_loss/deprel_loss: 0.4986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7302, loss: 0.6507, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||:  27%|##7       | 26/95 [00:18<00:46,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9548, LAS: 0.9153, UEM: 0.5932, LEM: 0.3459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4847, partial_loss/deprel_loss: 0.5432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7341, loss: 0.6479, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||:  31%|###       | 29/95 [00:20<00:46,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9553, LAS: 0.9154, UEM: 0.5956, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1736, partial_loss/deprel_loss: 0.3527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5195, loss: 0.6472, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||:  34%|###3      | 32/95 [00:22<00:43,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9364, UAS: 0.9560, LAS: 0.9162, UEM: 0.6137, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2107, partial_loss/deprel_loss: 0.2776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4668, loss: 0.6398, batch_reg_loss: 0.2026, reg_loss: 0.2027 ||:  37%|###6      | 35/95 [00:25<00:43,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9567, LAS: 0.9168, UEM: 0.6190, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4259, partial_loss/deprel_loss: 0.5109, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6964, loss: 0.6367, batch_reg_loss: 0.2026, reg_loss: 0.2026 ||:  40%|####      | 38/95 [00:27<00:41,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9576, LAS: 0.9179, UEM: 0.6319, LEM: 0.3817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1669, partial_loss/deprel_loss: 0.2997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4757, loss: 0.6291, batch_reg_loss: 0.2026, reg_loss: 0.2026 ||:  43%|####3     | 41/95 [00:29<00:38,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9573, LAS: 0.9176, UEM: 0.6268, LEM: 0.3779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6621, partial_loss/deprel_loss: 0.5440, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7702, loss: 0.6318, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||:  46%|####6     | 44/95 [00:31<00:37,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9581, LAS: 0.9185, UEM: 0.6446, LEM: 0.3997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1093, partial_loss/deprel_loss: 0.2532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4269, loss: 0.6259, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||:  49%|####9     | 47/95 [00:33<00:35,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9578, LAS: 0.9183, UEM: 0.6351, LEM: 0.3895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2864, partial_loss/deprel_loss: 0.3295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5234, loss: 0.6274, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||:  54%|#####3    | 51/95 [00:36<00:31,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8508, UAS: 0.9567, LAS: 0.9169, UEM: 0.6282, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3334, partial_loss/deprel_loss: 0.8025, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1112, loss: 0.6377, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||:  57%|#####6    | 54/95 [00:38<00:28,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9557, LAS: 0.9158, UEM: 0.6224, LEM: 0.3775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5367, partial_loss/deprel_loss: 0.5252, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7300, loss: 0.6446, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||:  60%|######    | 57/95 [00:40<00:26,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9569, LAS: 0.9172, UEM: 0.6417, LEM: 0.4002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3564, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5832, loss: 0.6343, batch_reg_loss: 0.2025, reg_loss: 0.2026 ||:  65%|######5   | 62/95 [00:43<00:20,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9569, LAS: 0.9174, UEM: 0.6374, LEM: 0.3967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6705, partial_loss/deprel_loss: 0.6447, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8523, loss: 0.6355, batch_reg_loss: 0.2024, reg_loss: 0.2026 ||:  71%|#######   | 67/95 [00:45<00:16,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8468, UAS: 0.9559, LAS: 0.9163, UEM: 0.6302, LEM: 0.3890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2689, partial_loss/deprel_loss: 0.8164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1094, loss: 0.6433, batch_reg_loss: 0.2024, reg_loss: 0.2026 ||:  76%|#######5  | 72/95 [00:47<00:12,  1.88it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9556, LAS: 0.9158, UEM: 0.6252, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2892, partial_loss/deprel_loss: 0.3821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5660, loss: 0.6471, batch_reg_loss: 0.2024, reg_loss: 0.2026 ||:  80%|########  | 76/95 [00:49<00:10,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9563, LAS: 0.9166, UEM: 0.6355, LEM: 0.3928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3708, partial_loss/deprel_loss: 0.4307, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6211, loss: 0.6427, batch_reg_loss: 0.2024, reg_loss: 0.2026 ||:  84%|########4 | 80/95 [00:52<00:09,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9561, LAS: 0.9164, UEM: 0.6302, LEM: 0.3872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4902, partial_loss/deprel_loss: 0.5109, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7091, loss: 0.6444, batch_reg_loss: 0.2024, reg_loss: 0.2025 ||:  88%|########8 | 84/95 [00:55<00:07,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9566, LAS: 0.9172, UEM: 0.6456, LEM: 0.4111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2067, partial_loss/deprel_loss: 0.2926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4778, loss: 0.6389, batch_reg_loss: 0.2024, reg_loss: 0.2025 ||:  93%|#########2| 88/95 [00:59<00:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9566, LAS: 0.9171, UEM: 0.6438, LEM: 0.4087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2377, partial_loss/deprel_loss: 0.3362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5189, loss: 0.6395, batch_reg_loss: 0.2024, reg_loss: 0.2025 ||:  96%|#########5| 91/95 [01:01<00:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9569, LAS: 0.9175, UEM: 0.6463, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.4120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.6364, batch_reg_loss: 0.2024, reg_loss: 0.2025 ||:  99%|#########8| 94/95 [01:03<00:00,  1.37it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9571, LAS: 0.9176, UEM: 0.6469, LEM: 0.4097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2050, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5666, loss: 0.6357, batch_reg_loss: 0.2024, reg_loss: 0.2025 ||: 100%|##########| 95/95 [01:04<00:00,  1.48it/s]\n",
+      "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.203  |       N/A\n",
+      "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - UEM                      |     0.647  |       N/A\n",
+      "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - LEM                      |     0.410  |       N/A\n",
+      "2023-04-07 01:10:19,433 - INFO - combo.training.tensorboard_writer - EM                       |     0.933  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.205  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - UAS                      |     0.957  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.404  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - loss                     |     0.636  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - LAS                      |     0.918  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:10:19,434 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:10:19,435 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:10:19,435 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:10:19,440 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:10:24,289 - INFO - combo.training.trainer - Epoch duration: 0:01:12.408076\n",
+      "2023-04-07 01:10:24,290 - INFO - combo.training.trainer - Estimated training time remaining: 5:13:23\n",
+      "2023-04-07 01:10:24,290 - INFO - allennlp.training.trainer - Epoch 124/399\n",
+      "2023-04-07 01:10:24,290 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:10:24,290 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:10:24,298 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9765, LAS: 0.9418, UEM: 0.7820, LEM: 0.5188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1438, partial_loss/deprel_loss: 0.3288, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4941, loss: 0.4928, batch_reg_loss: 0.2023, reg_loss: 0.2023 ||:   3%|3         | 3/95 [00:02<01:06,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9661, LAS: 0.9291, UEM: 0.7183, LEM: 0.4843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4962, partial_loss/deprel_loss: 0.4507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6621, loss: 0.5646, batch_reg_loss: 0.2023, reg_loss: 0.2023 ||:   6%|6         | 6/95 [00:04<01:04,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9637, LAS: 0.9263, UEM: 0.6649, LEM: 0.4202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5642, partial_loss/deprel_loss: 0.5338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7421, loss: 0.5819, batch_reg_loss: 0.2023, reg_loss: 0.2023 ||:  11%|#         | 10/95 [00:06<00:58,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9622, LAS: 0.9240, UEM: 0.6498, LEM: 0.4046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1761, partial_loss/deprel_loss: 0.2817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4628, loss: 0.6004, batch_reg_loss: 0.2023, reg_loss: 0.2023 ||:  14%|#3        | 13/95 [00:08<00:56,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9591, LAS: 0.9210, UEM: 0.6203, LEM: 0.3814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8691, partial_loss/deprel_loss: 0.6093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8636, loss: 0.6202, batch_reg_loss: 0.2023, reg_loss: 0.2023 ||:  17%|#6        | 16/95 [00:11<00:55,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9585, LAS: 0.9200, UEM: 0.6173, LEM: 0.3775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9060, partial_loss/deprel_loss: 0.6450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8995, loss: 0.6287, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||:  21%|##1       | 20/95 [00:13<00:52,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9577, LAS: 0.9189, UEM: 0.6070, LEM: 0.3655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2624, partial_loss/deprel_loss: 0.4049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5786, loss: 0.6363, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||:  24%|##4       | 23/95 [00:16<00:51,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9603, LAS: 0.9221, UEM: 0.6962, LEM: 0.4812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0908, partial_loss/deprel_loss: 0.2607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4290, loss: 0.6100, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||:  27%|##7       | 26/95 [00:19<00:56,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9596, LAS: 0.9213, UEM: 0.6856, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2466, partial_loss/deprel_loss: 0.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5332, loss: 0.6146, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||:  31%|###       | 29/95 [00:21<00:53,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9588, LAS: 0.9204, UEM: 0.6891, LEM: 0.4723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.2913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4601, loss: 0.6208, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||:  34%|###3      | 32/95 [00:23<00:49,  1.27it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9587, LAS: 0.9200, UEM: 0.6841, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7536, partial_loss/deprel_loss: 0.5833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8195, loss: 0.6237, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||:  37%|###6      | 35/95 [00:26<00:47,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9590, LAS: 0.9205, UEM: 0.6883, LEM: 0.4692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6676, partial_loss/deprel_loss: 0.5064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7408, loss: 0.6198, batch_reg_loss: 0.2022, reg_loss: 0.2023 ||:  40%|####      | 38/95 [00:28<00:45,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9300, UAS: 0.9595, LAS: 0.9206, UEM: 0.6843, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2497, partial_loss/deprel_loss: 0.3926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5662, loss: 0.6188, batch_reg_loss: 0.2022, reg_loss: 0.2022 ||:  44%|####4     | 42/95 [00:31<00:40,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9583, LAS: 0.9195, UEM: 0.6712, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3946, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6381, loss: 0.6288, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||:  47%|####7     | 45/95 [00:33<00:37,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9589, LAS: 0.9200, UEM: 0.6707, LEM: 0.4422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2488, partial_loss/deprel_loss: 0.3808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5565, loss: 0.6250, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||:  51%|#####     | 48/95 [00:35<00:34,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9582, LAS: 0.9192, UEM: 0.6620, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4370, partial_loss/deprel_loss: 0.4411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6424, loss: 0.6316, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||:  55%|#####4    | 52/95 [00:38<00:29,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9590, LAS: 0.9201, UEM: 0.6630, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2529, partial_loss/deprel_loss: 0.3615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5419, loss: 0.6265, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||:  59%|#####8    | 56/95 [00:40<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9591, LAS: 0.9204, UEM: 0.6680, LEM: 0.4394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5619, partial_loss/deprel_loss: 0.4953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7107, loss: 0.6241, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||:  63%|######3   | 60/95 [00:43<00:24,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9593, LAS: 0.9207, UEM: 0.6668, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4439, partial_loss/deprel_loss: 0.5178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7051, loss: 0.6225, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||:  66%|######6   | 63/95 [00:45<00:21,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9598, LAS: 0.9211, UEM: 0.6707, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3855, partial_loss/deprel_loss: 0.4356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6277, loss: 0.6206, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||:  69%|######9   | 66/95 [00:47<00:19,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9595, LAS: 0.9208, UEM: 0.6629, LEM: 0.4314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4894, partial_loss/deprel_loss: 0.4298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6437, loss: 0.6225, batch_reg_loss: 0.2021, reg_loss: 0.2022 ||:  73%|#######2  | 69/95 [00:49<00:18,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9592, LAS: 0.9206, UEM: 0.6657, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1943, partial_loss/deprel_loss: 0.3193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4963, loss: 0.6230, batch_reg_loss: 0.2020, reg_loss: 0.2022 ||:  77%|#######6  | 73/95 [00:51<00:14,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8910, UAS: 0.9583, LAS: 0.9196, UEM: 0.6557, LEM: 0.4264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9570, partial_loss/deprel_loss: 0.6285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8962, loss: 0.6307, batch_reg_loss: 0.2020, reg_loss: 0.2022 ||:  82%|########2 | 78/95 [00:54<00:10,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9577, LAS: 0.9189, UEM: 0.6487, LEM: 0.4199, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6121, partial_loss/deprel_loss: 0.5276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7465, loss: 0.6344, batch_reg_loss: 0.2020, reg_loss: 0.2022 ||:  87%|########7 | 83/95 [00:56<00:06,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9578, LAS: 0.9188, UEM: 0.6475, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4638, partial_loss/deprel_loss: 0.5290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7179, loss: 0.6341, batch_reg_loss: 0.2020, reg_loss: 0.2022 ||:  93%|#########2| 88/95 [00:59<00:03,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9584, LAS: 0.9194, UEM: 0.6526, LEM: 0.4189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2525, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5396, loss: 0.6302, batch_reg_loss: 0.2020, reg_loss: 0.2021 ||:  97%|#########6| 92/95 [01:02<00:01,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9579, LAS: 0.9188, UEM: 0.6505, LEM: 0.4164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3767, partial_loss/deprel_loss: 0.4896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6690, loss: 0.6343, batch_reg_loss: 0.2020, reg_loss: 0.2021 ||: 100%|##########| 95/95 [01:04<00:00,  1.48it/s]\n",
+      "2023-04-07 01:11:31,294 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:11:31,294 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:11:31,294 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.202  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - UEM                      |     0.650  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - LEM                      |     0.416  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - EM                       |     0.917  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.377  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - UAS                      |     0.958  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.490  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - loss                     |     0.634  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - LAS                      |     0.919  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:11:31,295 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:11:31,296 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:11:31,299 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:11:35,526 - INFO - combo.training.trainer - Epoch duration: 0:01:11.235946\n",
+      "2023-04-07 01:11:35,526 - INFO - combo.training.trainer - Estimated training time remaining: 5:12:22\n",
+      "2023-04-07 01:11:35,526 - INFO - allennlp.training.trainer - Epoch 125/399\n",
+      "2023-04-07 01:11:35,526 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:11:35,527 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:11:35,534 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9727, LAS: 0.9330, UEM: 0.7624, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2298, partial_loss/deprel_loss: 0.3928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5621, loss: 0.5460, batch_reg_loss: 0.2020, reg_loss: 0.2020 ||:   3%|3         | 3/95 [00:02<01:12,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9598, LAS: 0.9199, UEM: 0.6872, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1942, partial_loss/deprel_loss: 0.3307, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5053, loss: 0.6276, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||:   6%|6         | 6/95 [00:04<01:10,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9616, LAS: 0.9217, UEM: 0.6680, LEM: 0.3982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3015, partial_loss/deprel_loss: 0.3950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5782, loss: 0.6213, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||:  11%|#         | 10/95 [00:07<01:02,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9636, LAS: 0.9240, UEM: 0.6833, LEM: 0.4095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1830, partial_loss/deprel_loss: 0.3177, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4927, loss: 0.5963, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||:  15%|#4        | 14/95 [00:10<00:59,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9638, LAS: 0.9243, UEM: 0.6749, LEM: 0.3969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4080, partial_loss/deprel_loss: 0.4319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6290, loss: 0.5924, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||:  18%|#7        | 17/95 [00:12<00:58,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9627, LAS: 0.9238, UEM: 0.6518, LEM: 0.3788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4117, partial_loss/deprel_loss: 0.4157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6167, loss: 0.5937, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||:  21%|##1       | 20/95 [00:14<00:54,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9643, LAS: 0.9255, UEM: 0.6762, LEM: 0.4063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1209, partial_loss/deprel_loss: 0.2901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4581, loss: 0.5823, batch_reg_loss: 0.2019, reg_loss: 0.2019 ||:  24%|##4       | 23/95 [00:16<00:53,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9662, LAS: 0.9276, UEM: 0.7097, LEM: 0.4462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0926, partial_loss/deprel_loss: 0.2642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4317, loss: 0.5671, batch_reg_loss: 0.2018, reg_loss: 0.2019 ||:  27%|##7       | 26/95 [00:19<00:53,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9650, LAS: 0.9264, UEM: 0.7100, LEM: 0.4561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6103, partial_loss/deprel_loss: 0.5114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7330, loss: 0.5736, batch_reg_loss: 0.2018, reg_loss: 0.2019 ||:  31%|###       | 29/95 [00:21<00:51,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9643, LAS: 0.9255, UEM: 0.7037, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3383, partial_loss/deprel_loss: 0.4147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.5795, batch_reg_loss: 0.2018, reg_loss: 0.2019 ||:  34%|###3      | 32/95 [00:24<00:48,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9626, LAS: 0.9236, UEM: 0.6871, LEM: 0.4382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4311, partial_loss/deprel_loss: 0.5208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7046, loss: 0.5945, batch_reg_loss: 0.2018, reg_loss: 0.2019 ||:  37%|###6      | 35/95 [00:26<00:45,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9622, LAS: 0.9235, UEM: 0.6751, LEM: 0.4275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3145, partial_loss/deprel_loss: 0.3811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5696, loss: 0.5969, batch_reg_loss: 0.2018, reg_loss: 0.2019 ||:  40%|####      | 38/95 [00:28<00:42,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9708, UAS: 0.9622, LAS: 0.9239, UEM: 0.6983, LEM: 0.4666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0376, partial_loss/deprel_loss: 0.1143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3007, loss: 0.5956, batch_reg_loss: 0.2017, reg_loss: 0.2019 ||:  43%|####3     | 41/95 [00:30<00:41,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9288, UAS: 0.9617, LAS: 0.9231, UEM: 0.6876, LEM: 0.4549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2292, partial_loss/deprel_loss: 0.3355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5159, loss: 0.6006, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||:  47%|####7     | 45/95 [00:33<00:37,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9612, LAS: 0.9227, UEM: 0.6824, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2393, partial_loss/deprel_loss: 0.3674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5435, loss: 0.6015, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||:  52%|#####1    | 49/95 [00:36<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8496, UAS: 0.9600, LAS: 0.9214, UEM: 0.6797, LEM: 0.4462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2860, partial_loss/deprel_loss: 0.7001, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0190, loss: 0.6081, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||:  55%|#####4    | 52/95 [00:40<00:39,  1.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9595, LAS: 0.9208, UEM: 0.6774, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7134, partial_loss/deprel_loss: 0.5727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8025, loss: 0.6134, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||:  58%|#####7    | 55/95 [00:42<00:33,  1.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9597, LAS: 0.9209, UEM: 0.6760, LEM: 0.4410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2389, partial_loss/deprel_loss: 0.3760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5502, loss: 0.6121, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||:  61%|######1   | 58/95 [00:44<00:29,  1.25it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9596, LAS: 0.9208, UEM: 0.6722, LEM: 0.4365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4008, partial_loss/deprel_loss: 0.3814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5870, loss: 0.6125, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||:  65%|######5   | 62/95 [00:46<00:24,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9599, LAS: 0.9212, UEM: 0.6732, LEM: 0.4365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4425, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6662, loss: 0.6095, batch_reg_loss: 0.2017, reg_loss: 0.2018 ||:  69%|######9   | 66/95 [00:49<00:20,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9533, UAS: 0.9597, LAS: 0.9212, UEM: 0.6806, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1058, partial_loss/deprel_loss: 0.2003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3831, loss: 0.6090, batch_reg_loss: 0.2016, reg_loss: 0.2018 ||:  73%|#######2  | 69/95 [00:51<00:18,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9598, LAS: 0.9213, UEM: 0.6795, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5656, partial_loss/deprel_loss: 0.5189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7299, loss: 0.6075, batch_reg_loss: 0.2016, reg_loss: 0.2018 ||:  77%|#######6  | 73/95 [00:53<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9588, LAS: 0.9204, UEM: 0.6721, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4846, partial_loss/deprel_loss: 0.5055, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7029, loss: 0.6140, batch_reg_loss: 0.2016, reg_loss: 0.2018 ||:  81%|########1 | 77/95 [00:56<00:12,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9583, LAS: 0.9198, UEM: 0.6638, LEM: 0.4316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7274, partial_loss/deprel_loss: 0.5789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8102, loss: 0.6188, batch_reg_loss: 0.2016, reg_loss: 0.2018 ||:  85%|########5 | 81/95 [00:59<00:09,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9584, LAS: 0.9200, UEM: 0.6629, LEM: 0.4314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1167, partial_loss/deprel_loss: 0.2720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4425, loss: 0.6179, batch_reg_loss: 0.2016, reg_loss: 0.2018 ||:  89%|########9 | 85/95 [01:01<00:06,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9578, LAS: 0.9191, UEM: 0.6565, LEM: 0.4244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6786, partial_loss/deprel_loss: 0.5944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8128, loss: 0.6245, batch_reg_loss: 0.2016, reg_loss: 0.2017 ||:  95%|#########4| 90/95 [01:03<00:02,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9574, LAS: 0.9186, UEM: 0.6510, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1776, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5053, loss: 0.6280, batch_reg_loss: 0.2016, reg_loss: 0.2017 ||: 100%|##########| 95/95 [01:06<00:00,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9574, LAS: 0.9186, UEM: 0.6510, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1776, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5053, loss: 0.6280, batch_reg_loss: 0.2016, reg_loss: 0.2017 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-07 01:12:45,128 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9510, LAS: 0.9035, UEM: 0.7940, LEM: 0.6163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0306, partial_loss/deprel_loss: 17.9014, partial_loss/cycle_loss: 0.0000, batch_loss: 14.5273, loss: 9.4725, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.05s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9523, LAS: 0.9032, UEM: 0.7358, LEM: 0.5074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1613, partial_loss/deprel_loss: 6.3737, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1312, loss: 10.3144, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:05<00:06,  1.04s/it] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9466, LAS: 0.8957, UEM: 0.6798, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5936, partial_loss/deprel_loss: 8.5089, partial_loss/cycle_loss: 0.0000, batch_loss: 6.9258, loss: 11.1434, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:07<00:04,  1.03s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9480, LAS: 0.8973, UEM: 0.6645, LEM: 0.4026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3634, partial_loss/deprel_loss: 8.6906, partial_loss/cycle_loss: 0.0000, batch_loss: 7.0251, loss: 10.1889, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:09<00:00,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9497, LAS: 0.8995, UEM: 0.6775, LEM: 0.4090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4289, partial_loss/deprel_loss: 7.0862, partial_loss/cycle_loss: 0.0000, batch_loss: 5.7547, loss: 9.7858, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.03it/s] \n",
+      "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.202  |     0.000\n",
+      "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - UEM                      |     0.651  |     0.677\n",
+      "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - LEM                      |     0.418  |     0.409\n",
+      "2023-04-07 01:12:55,794 - INFO - combo.training.tensorboard_writer - EM                       |     0.936  |     0.922\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.178  |     0.429\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - UAS                      |     0.957  |     0.950\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.335  |     7.086\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - loss                     |     0.628  |     9.786\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - LAS                      |     0.919  |     0.899\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:12:55,795 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:12:55,799 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:13:00,394 - INFO - combo.training.trainer - Epoch duration: 0:01:24.867347\n",
+      "2023-04-07 01:13:00,394 - INFO - combo.training.trainer - Estimated training time remaining: 5:11:50\n",
+      "2023-04-07 01:13:00,394 - INFO - allennlp.training.trainer - Epoch 126/399\n",
+      "2023-04-07 01:13:00,394 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:13:00,395 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:13:00,402 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9772, LAS: 0.9414, UEM: 0.8386, LEM: 0.6353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0986, partial_loss/deprel_loss: 0.1837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3682, loss: 0.4718, batch_reg_loss: 0.2016, reg_loss: 0.2016 ||:   3%|3         | 3/95 [00:02<01:03,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9713, LAS: 0.9333, UEM: 0.7912, LEM: 0.5681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1304, partial_loss/deprel_loss: 0.2594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4351, loss: 0.5159, batch_reg_loss: 0.2015, reg_loss: 0.2016 ||:   6%|6         | 6/95 [00:04<01:01,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9652, LAS: 0.9277, UEM: 0.7161, LEM: 0.4873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2455, partial_loss/deprel_loss: 0.3899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5626, loss: 0.5609, batch_reg_loss: 0.2015, reg_loss: 0.2015 ||:  11%|#         | 10/95 [00:06<00:57,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9684, LAS: 0.9322, UEM: 0.7560, LEM: 0.5313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1075, partial_loss/deprel_loss: 0.2256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4035, loss: 0.5308, batch_reg_loss: 0.2015, reg_loss: 0.2015 ||:  15%|#4        | 14/95 [00:09<00:54,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9651, LAS: 0.9286, UEM: 0.7391, LEM: 0.5164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1538, partial_loss/deprel_loss: 0.3231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4907, loss: 0.5543, batch_reg_loss: 0.2015, reg_loss: 0.2015 ||:  18%|#7        | 17/95 [00:11<00:53,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9648, LAS: 0.9285, UEM: 0.7214, LEM: 0.4970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2192, partial_loss/deprel_loss: 0.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5271, loss: 0.5599, batch_reg_loss: 0.2015, reg_loss: 0.2015 ||:  21%|##1       | 20/95 [00:13<00:52,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9655, LAS: 0.9289, UEM: 0.7323, LEM: 0.5032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3495, partial_loss/deprel_loss: 0.3889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5825, loss: 0.5538, batch_reg_loss: 0.2015, reg_loss: 0.2015 ||:  24%|##4       | 23/95 [00:16<00:52,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9658, LAS: 0.9287, UEM: 0.7277, LEM: 0.4930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1855, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5463, loss: 0.5550, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||:  27%|##7       | 26/95 [00:18<00:51,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9655, LAS: 0.9283, UEM: 0.7182, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2810, partial_loss/deprel_loss: 0.3895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5692, loss: 0.5568, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||:  31%|###       | 29/95 [00:20<00:48,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9680, UAS: 0.9652, LAS: 0.9283, UEM: 0.7284, LEM: 0.5052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0355, partial_loss/deprel_loss: 0.1220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3061, loss: 0.5586, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||:  35%|###4      | 33/95 [00:23<00:46,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8923, UAS: 0.9636, LAS: 0.9265, UEM: 0.7188, LEM: 0.4964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8579, partial_loss/deprel_loss: 0.5797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8367, loss: 0.5703, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||:  38%|###7      | 36/95 [00:25<00:43,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9643, LAS: 0.9269, UEM: 0.7215, LEM: 0.4945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1387, partial_loss/deprel_loss: 0.2731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4476, loss: 0.5679, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||:  41%|####1     | 39/95 [00:28<00:41,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 0.9623, LAS: 0.9248, UEM: 0.7082, LEM: 0.4834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3996, partial_loss/deprel_loss: 0.7611, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0902, loss: 0.5859, batch_reg_loss: 0.2014, reg_loss: 0.2015 ||:  44%|####4     | 42/95 [00:30<00:38,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9614, LAS: 0.9236, UEM: 0.6933, LEM: 0.4678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8482, partial_loss/deprel_loss: 0.6434, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8857, loss: 0.5937, batch_reg_loss: 0.2013, reg_loss: 0.2015 ||:  48%|####8     | 46/95 [00:32<00:33,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9623, LAS: 0.9244, UEM: 0.7066, LEM: 0.4795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1985, partial_loss/deprel_loss: 0.3384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.5878, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||:  52%|#####1    | 49/95 [00:34<00:32,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9618, LAS: 0.9238, UEM: 0.7034, LEM: 0.4771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6143, partial_loss/deprel_loss: 0.5572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7699, loss: 0.5918, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||:  55%|#####4    | 52/95 [00:37<00:31,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9615, LAS: 0.9233, UEM: 0.6965, LEM: 0.4692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2506, partial_loss/deprel_loss: 0.3667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.5971, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||:  59%|#####8    | 56/95 [00:39<00:28,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9609, LAS: 0.9227, UEM: 0.6897, LEM: 0.4626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5770, partial_loss/deprel_loss: 0.4771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6984, loss: 0.5998, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||:  63%|######3   | 60/95 [00:42<00:23,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9600, LAS: 0.9217, UEM: 0.6836, LEM: 0.4567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3667, partial_loss/deprel_loss: 0.4615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6438, loss: 0.6066, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||:  67%|######7   | 64/95 [00:44<00:20,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9586, LAS: 0.9201, UEM: 0.6741, LEM: 0.4474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5645, partial_loss/deprel_loss: 0.4994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7137, loss: 0.6182, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||:  72%|#######1  | 68/95 [00:47<00:18,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9581, LAS: 0.9196, UEM: 0.6668, LEM: 0.4409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6667, partial_loss/deprel_loss: 0.5602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7827, loss: 0.6209, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||:  76%|#######5  | 72/95 [00:49<00:15,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9575, LAS: 0.9190, UEM: 0.6594, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5403, partial_loss/deprel_loss: 0.4920, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7029, loss: 0.6248, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||:  80%|########  | 76/95 [00:52<00:12,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9580, LAS: 0.9195, UEM: 0.6659, LEM: 0.4398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3179, partial_loss/deprel_loss: 0.3758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5655, loss: 0.6214, batch_reg_loss: 0.2013, reg_loss: 0.2014 ||:  84%|########4 | 80/95 [00:55<00:10,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9579, LAS: 0.9194, UEM: 0.6578, LEM: 0.4304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3447, partial_loss/deprel_loss: 0.4449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6261, loss: 0.6225, batch_reg_loss: 0.2012, reg_loss: 0.2014 ||:  89%|########9 | 85/95 [00:58<00:06,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9581, LAS: 0.9196, UEM: 0.6574, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2276, partial_loss/deprel_loss: 0.2833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4734, loss: 0.6205, batch_reg_loss: 0.2012, reg_loss: 0.2014 ||:  94%|#########3| 89/95 [01:00<00:03,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9579, LAS: 0.9195, UEM: 0.6501, LEM: 0.4220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4741, partial_loss/deprel_loss: 0.4854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6844, loss: 0.6220, batch_reg_loss: 0.2012, reg_loss: 0.2014 ||:  98%|#########7| 93/95 [01:02<00:01,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9576, LAS: 0.9191, UEM: 0.6473, LEM: 0.4191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9417, partial_loss/deprel_loss: 0.5799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8535, loss: 0.6244, batch_reg_loss: 0.2012, reg_loss: 0.2014 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.201  |       N/A\n",
+      "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - UEM                      |     0.647  |       N/A\n",
+      "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - LEM                      |     0.419  |       N/A\n",
+      "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - EM                       |     0.883  |       N/A\n",
+      "2023-04-07 01:14:07,173 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.942  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - UAS                      |     0.958  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.580  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - loss                     |     0.624  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - LAS                      |     0.919  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:14:07,174 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:14:07,179 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:14:12,486 - INFO - combo.training.trainer - Epoch duration: 0:01:12.091447\n",
+      "2023-04-07 01:14:12,486 - INFO - combo.training.trainer - Estimated training time remaining: 5:10:50\n",
+      "2023-04-07 01:14:12,486 - INFO - allennlp.training.trainer - Epoch 127/399\n",
+      "2023-04-07 01:14:12,487 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:14:12,487 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:14:12,497 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9739, LAS: 0.9382, UEM: 0.7630, LEM: 0.4788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2674, partial_loss/deprel_loss: 0.3419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5282, loss: 0.5111, batch_reg_loss: 0.2012, reg_loss: 0.2012 ||:   4%|4         | 4/95 [00:02<00:45,  1.98it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9681, LAS: 0.9307, UEM: 0.7433, LEM: 0.4810, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1699, partial_loss/deprel_loss: 0.3132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4857, loss: 0.5487, batch_reg_loss: 0.2012, reg_loss: 0.2012 ||:   8%|8         | 8/95 [00:05<00:50,  1.71it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9642, LAS: 0.9272, UEM: 0.7015, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2023, partial_loss/deprel_loss: 0.3681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5361, loss: 0.5721, batch_reg_loss: 0.2012, reg_loss: 0.2012 ||:  12%|#1        | 11/95 [00:07<00:52,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9613, LAS: 0.9238, UEM: 0.6804, LEM: 0.4289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5743, partial_loss/deprel_loss: 0.5249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7360, loss: 0.5969, batch_reg_loss: 0.2012, reg_loss: 0.2012 ||:  16%|#5        | 15/95 [00:09<00:50,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9280, UAS: 0.9621, LAS: 0.9246, UEM: 0.6907, LEM: 0.4387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2519, partial_loss/deprel_loss: 0.3477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5297, loss: 0.5854, batch_reg_loss: 0.2011, reg_loss: 0.2012 ||:  19%|#8        | 18/95 [00:12<00:51,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9680, UAS: 0.9650, LAS: 0.9283, UEM: 0.7494, LEM: 0.5237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0463, partial_loss/deprel_loss: 0.1296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3141, loss: 0.5614, batch_reg_loss: 0.2011, reg_loss: 0.2012 ||:  22%|##2       | 21/95 [00:14<00:55,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9650, LAS: 0.9281, UEM: 0.7352, LEM: 0.5033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 0.3558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5185, loss: 0.5639, batch_reg_loss: 0.2011, reg_loss: 0.2012 ||:  26%|##6       | 25/95 [00:17<00:48,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9393, UAS: 0.9653, LAS: 0.9285, UEM: 0.7276, LEM: 0.4932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2053, partial_loss/deprel_loss: 0.3580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5285, loss: 0.5639, batch_reg_loss: 0.2011, reg_loss: 0.2011 ||:  31%|###       | 29/95 [00:19<00:44,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9656, LAS: 0.9284, UEM: 0.7280, LEM: 0.4914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3123, partial_loss/deprel_loss: 0.4142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5948, loss: 0.5647, batch_reg_loss: 0.2011, reg_loss: 0.2011 ||:  34%|###3      | 32/95 [00:21<00:42,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9645, LAS: 0.9272, UEM: 0.7129, LEM: 0.4766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1832, partial_loss/deprel_loss: 0.3297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5014, loss: 0.5741, batch_reg_loss: 0.2010, reg_loss: 0.2011 ||:  38%|###7      | 36/95 [00:24<00:40,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9649, LAS: 0.9274, UEM: 0.7101, LEM: 0.4685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3522, partial_loss/deprel_loss: 0.4360, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6202, loss: 0.5739, batch_reg_loss: 0.2010, reg_loss: 0.2011 ||:  41%|####1     | 39/95 [00:26<00:39,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9654, LAS: 0.9278, UEM: 0.7141, LEM: 0.4691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3462, partial_loss/deprel_loss: 0.4392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6216, loss: 0.5726, batch_reg_loss: 0.2010, reg_loss: 0.2011 ||:  44%|####4     | 42/95 [00:28<00:37,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9647, LAS: 0.9272, UEM: 0.7092, LEM: 0.4665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1644, partial_loss/deprel_loss: 0.2823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4597, loss: 0.5752, batch_reg_loss: 0.2010, reg_loss: 0.2011 ||:  48%|####8     | 46/95 [00:31<00:34,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9630, LAS: 0.9255, UEM: 0.7011, LEM: 0.4610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2332, partial_loss/deprel_loss: 0.3335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.5878, batch_reg_loss: 0.2010, reg_loss: 0.2011 ||:  52%|#####1    | 49/95 [00:33<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9631, LAS: 0.9255, UEM: 0.7005, LEM: 0.4632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1052, partial_loss/deprel_loss: 0.2660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4348, loss: 0.5863, batch_reg_loss: 0.2009, reg_loss: 0.2011 ||:  56%|#####5    | 53/95 [00:36<00:29,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9629, LAS: 0.9252, UEM: 0.6964, LEM: 0.4573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1875, partial_loss/deprel_loss: 0.2794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4619, loss: 0.5870, batch_reg_loss: 0.2009, reg_loss: 0.2011 ||:  60%|######    | 57/95 [00:39<00:26,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9625, LAS: 0.9246, UEM: 0.6915, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2424, partial_loss/deprel_loss: 0.4287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5924, loss: 0.5919, batch_reg_loss: 0.2009, reg_loss: 0.2011 ||:  64%|######4   | 61/95 [00:42<00:23,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9142, UAS: 0.9619, LAS: 0.9241, UEM: 0.6864, LEM: 0.4488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5492, partial_loss/deprel_loss: 0.4411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6636, loss: 0.5949, batch_reg_loss: 0.2009, reg_loss: 0.2011 ||:  67%|######7   | 64/95 [00:44<00:22,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8961, UAS: 0.9606, LAS: 0.9227, UEM: 0.6774, LEM: 0.4413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7253, partial_loss/deprel_loss: 0.5621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7956, loss: 0.6048, batch_reg_loss: 0.2009, reg_loss: 0.2010 ||:  71%|#######   | 67/95 [00:46<00:20,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9610, LAS: 0.9228, UEM: 0.6762, LEM: 0.4367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2409, partial_loss/deprel_loss: 0.4075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5750, loss: 0.6024, batch_reg_loss: 0.2009, reg_loss: 0.2010 ||:  75%|#######4  | 71/95 [00:48<00:16,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9600, LAS: 0.9219, UEM: 0.6669, LEM: 0.4278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7751, partial_loss/deprel_loss: 0.5957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8324, loss: 0.6088, batch_reg_loss: 0.2009, reg_loss: 0.2010 ||:  79%|#######8  | 75/95 [00:51<00:13,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9601, LAS: 0.9222, UEM: 0.6717, LEM: 0.4359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5031, partial_loss/deprel_loss: 0.5019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7030, loss: 0.6068, batch_reg_loss: 0.2009, reg_loss: 0.2010 ||:  83%|########3 | 79/95 [00:54<00:11,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9590, LAS: 0.9210, UEM: 0.6638, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1759, partial_loss/deprel_loss: 0.7507, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0366, loss: 0.6173, batch_reg_loss: 0.2008, reg_loss: 0.2010 ||:  86%|########6 | 82/95 [00:56<00:09,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9586, LAS: 0.9206, UEM: 0.6571, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3880, partial_loss/deprel_loss: 0.4338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6255, loss: 0.6197, batch_reg_loss: 0.2008, reg_loss: 0.2010 ||:  89%|########9 | 85/95 [00:59<00:07,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9586, LAS: 0.9205, UEM: 0.6572, LEM: 0.4235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6085, partial_loss/deprel_loss: 0.5601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7706, loss: 0.6196, batch_reg_loss: 0.2008, reg_loss: 0.2010 ||:  93%|#########2| 88/95 [01:01<00:05,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9593, LAS: 0.9212, UEM: 0.6665, LEM: 0.4321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0789, partial_loss/deprel_loss: 0.2412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4095, loss: 0.6155, batch_reg_loss: 0.2008, reg_loss: 0.2010 ||:  97%|#########6| 92/95 [01:04<00:02,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9590, LAS: 0.9209, UEM: 0.6612, LEM: 0.4272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3630, partial_loss/deprel_loss: 0.3949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5893, loss: 0.6174, batch_reg_loss: 0.2008, reg_loss: 0.2010 ||: 100%|##########| 95/95 [01:05<00:00,  1.44it/s]\n",
+      "2023-04-07 01:15:21,660 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.201  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - UEM                      |     0.661  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - LEM                      |     0.427  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - EM                       |     0.926  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.363  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.395  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - loss                     |     0.617  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - LAS                      |     0.921  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:15:21,661 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:15:21,662 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:15:21,662 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:15:21,662 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:15:21,662 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:15:21,667 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:15:26,676 - INFO - combo.training.trainer - Epoch duration: 0:01:14.189760\n",
+      "2023-04-07 01:15:26,677 - INFO - combo.training.trainer - Estimated training time remaining: 5:09:54\n",
+      "2023-04-07 01:15:26,677 - INFO - allennlp.training.trainer - Epoch 128/399\n",
+      "2023-04-07 01:15:26,677 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:15:26,678 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:15:26,688 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9631, LAS: 0.9239, UEM: 0.6215, LEM: 0.3546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2397, partial_loss/deprel_loss: 0.3410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5215, loss: 0.5860, batch_reg_loss: 0.2008, reg_loss: 0.2008 ||:   3%|3         | 3/95 [00:02<01:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9458, UAS: 0.9607, LAS: 0.9213, UEM: 0.6019, LEM: 0.3412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1463, partial_loss/deprel_loss: 0.3190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4853, loss: 0.6123, batch_reg_loss: 0.2008, reg_loss: 0.2008 ||:   7%|7         | 7/95 [00:04<00:57,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9596, LAS: 0.9208, UEM: 0.6229, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4060, partial_loss/deprel_loss: 0.4722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6598, loss: 0.6096, batch_reg_loss: 0.2008, reg_loss: 0.2008 ||:  13%|#2        | 12/95 [00:06<00:49,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9572, LAS: 0.9186, UEM: 0.6252, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5571, partial_loss/deprel_loss: 0.4929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7065, loss: 0.6281, batch_reg_loss: 0.2008, reg_loss: 0.2008 ||:  17%|#6        | 16/95 [00:08<00:45,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9480, UAS: 0.9584, LAS: 0.9201, UEM: 0.6581, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0955, partial_loss/deprel_loss: 0.2614, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4290, loss: 0.6133, batch_reg_loss: 0.2007, reg_loss: 0.2008 ||:  22%|##2       | 21/95 [00:11<00:41,  1.80it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9592, LAS: 0.9209, UEM: 0.6667, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3006, partial_loss/deprel_loss: 0.4103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5891, loss: 0.6094, batch_reg_loss: 0.2007, reg_loss: 0.2008 ||:  26%|##6       | 25/95 [00:13<00:40,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9610, LAS: 0.9231, UEM: 0.6955, LEM: 0.4624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2267, partial_loss/deprel_loss: 0.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4736, loss: 0.5951, batch_reg_loss: 0.2007, reg_loss: 0.2008 ||:  31%|###       | 29/95 [00:16<00:40,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9602, LAS: 0.9222, UEM: 0.6792, LEM: 0.4445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3083, partial_loss/deprel_loss: 0.3617, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5517, loss: 0.6033, batch_reg_loss: 0.2007, reg_loss: 0.2007 ||:  35%|###4      | 33/95 [00:19<00:39,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9596, LAS: 0.9220, UEM: 0.6778, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3199, partial_loss/deprel_loss: 0.3508, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5453, loss: 0.6060, batch_reg_loss: 0.2007, reg_loss: 0.2007 ||:  39%|###8      | 37/95 [00:22<00:38,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8871, UAS: 0.9593, LAS: 0.9215, UEM: 0.6763, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8521, partial_loss/deprel_loss: 0.6038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8541, loss: 0.6095, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||:  43%|####3     | 41/95 [00:24<00:35,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9597, LAS: 0.9218, UEM: 0.6778, LEM: 0.4418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1736, partial_loss/deprel_loss: 0.3180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4898, loss: 0.6066, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||:  46%|####6     | 44/95 [00:27<00:35,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9589, LAS: 0.9205, UEM: 0.6627, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6611, partial_loss/deprel_loss: 0.5736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7917, loss: 0.6158, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||:  51%|#####     | 48/95 [00:29<00:32,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9577, LAS: 0.9195, UEM: 0.6543, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2906, partial_loss/deprel_loss: 0.3542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5421, loss: 0.6220, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||:  54%|#####3    | 51/95 [00:31<00:30,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9582, LAS: 0.9200, UEM: 0.6520, LEM: 0.4167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1726, partial_loss/deprel_loss: 0.2786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4580, loss: 0.6194, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||:  57%|#####6    | 54/95 [00:33<00:28,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9581, LAS: 0.9200, UEM: 0.6490, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6074, partial_loss/deprel_loss: 0.5364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7512, loss: 0.6199, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||:  60%|######    | 57/95 [00:36<00:27,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9582, LAS: 0.9202, UEM: 0.6509, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2521, partial_loss/deprel_loss: 0.3419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5246, loss: 0.6191, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||:  63%|######3   | 60/95 [00:38<00:26,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9583, LAS: 0.9202, UEM: 0.6537, LEM: 0.4209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3821, partial_loss/deprel_loss: 0.4796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6607, loss: 0.6180, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||:  66%|######6   | 63/95 [00:40<00:23,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9579, LAS: 0.9197, UEM: 0.6464, LEM: 0.4136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7458, partial_loss/deprel_loss: 0.6028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8320, loss: 0.6227, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||:  69%|######9   | 66/95 [00:42<00:20,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9579, LAS: 0.9197, UEM: 0.6427, LEM: 0.4094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2012, partial_loss/deprel_loss: 0.3035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4836, loss: 0.6232, batch_reg_loss: 0.2006, reg_loss: 0.2007 ||:  73%|#######2  | 69/95 [00:44<00:18,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9574, LAS: 0.9192, UEM: 0.6365, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3333, partial_loss/deprel_loss: 0.3599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5551, loss: 0.6278, batch_reg_loss: 0.2005, reg_loss: 0.2007 ||:  77%|#######6  | 73/95 [00:47<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9570, LAS: 0.9188, UEM: 0.6392, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1122, partial_loss/deprel_loss: 0.2291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4062, loss: 0.6284, batch_reg_loss: 0.2005, reg_loss: 0.2007 ||:  81%|########1 | 77/95 [00:49<00:12,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9571, LAS: 0.9188, UEM: 0.6399, LEM: 0.4095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1791, partial_loss/deprel_loss: 0.3245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4960, loss: 0.6296, batch_reg_loss: 0.2005, reg_loss: 0.2007 ||:  84%|########4 | 80/95 [00:52<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9574, LAS: 0.9193, UEM: 0.6407, LEM: 0.4081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2936, partial_loss/deprel_loss: 0.4140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5905, loss: 0.6260, batch_reg_loss: 0.2005, reg_loss: 0.2007 ||:  88%|########8 | 84/95 [00:54<00:07,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9582, LAS: 0.9201, UEM: 0.6564, LEM: 0.4279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3467, partial_loss/deprel_loss: 0.3845, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5775, loss: 0.6202, batch_reg_loss: 0.2005, reg_loss: 0.2006 ||:  93%|#########2| 88/95 [00:57<00:04,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9585, LAS: 0.9203, UEM: 0.6591, LEM: 0.4284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4352, partial_loss/deprel_loss: 0.5214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7046, loss: 0.6176, batch_reg_loss: 0.2005, reg_loss: 0.2006 ||:  97%|#########6| 92/95 [00:59<00:02,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9582, LAS: 0.9201, UEM: 0.6531, LEM: 0.4225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5036, partial_loss/deprel_loss: 0.5400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7332, loss: 0.6198, batch_reg_loss: 0.2005, reg_loss: 0.2006 ||: 100%|##########| 95/95 [01:01<00:00,  1.54it/s]\n",
+      "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.201  |       N/A\n",
+      "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - UEM                      |     0.653  |       N/A\n",
+      "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - LEM                      |     0.422  |       N/A\n",
+      "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - EM                       |     0.897  |       N/A\n",
+      "2023-04-07 01:16:31,053 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.504  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - UAS                      |     0.958  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.540  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - loss                     |     0.620  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - LAS                      |     0.920  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:16:31,054 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:16:31,058 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:16:35,283 - INFO - combo.training.trainer - Epoch duration: 0:01:08.605642\n",
+      "2023-04-07 01:16:35,283 - INFO - combo.training.trainer - Estimated training time remaining: 5:08:46\n",
+      "2023-04-07 01:16:35,283 - INFO - allennlp.training.trainer - Epoch 129/399\n",
+      "2023-04-07 01:16:35,283 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:16:35,284 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:16:35,293 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9487, LAS: 0.9084, UEM: 0.4551, LEM: 0.2244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6219, partial_loss/deprel_loss: 0.5310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7497, loss: 0.7101, batch_reg_loss: 0.2005, reg_loss: 0.2005 ||:   3%|3         | 3/95 [00:02<01:02,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9595, LAS: 0.9227, UEM: 0.5622, LEM: 0.3092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1934, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5250, loss: 0.6236, batch_reg_loss: 0.2004, reg_loss: 0.2005 ||:   7%|7         | 7/95 [00:04<00:57,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9568, LAS: 0.9193, UEM: 0.6007, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2255, partial_loss/deprel_loss: 0.3540, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5287, loss: 0.6336, batch_reg_loss: 0.2004, reg_loss: 0.2004 ||:  11%|#         | 10/95 [00:06<00:57,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9604, LAS: 0.9228, UEM: 0.6565, LEM: 0.4014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1986, partial_loss/deprel_loss: 0.3299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5041, loss: 0.6059, batch_reg_loss: 0.2004, reg_loss: 0.2004 ||:  14%|#3        | 13/95 [00:09<00:59,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9605, LAS: 0.9228, UEM: 0.6833, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4336, partial_loss/deprel_loss: 0.4614, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6563, loss: 0.6044, batch_reg_loss: 0.2004, reg_loss: 0.2004 ||:  17%|#6        | 16/95 [00:11<00:57,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9621, LAS: 0.9241, UEM: 0.6955, LEM: 0.4608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5454, loss: 0.5916, batch_reg_loss: 0.2004, reg_loss: 0.2004 ||:  20%|##        | 19/95 [00:13<00:55,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9618, LAS: 0.9234, UEM: 0.6882, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1866, partial_loss/deprel_loss: 0.3131, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4882, loss: 0.5959, batch_reg_loss: 0.2004, reg_loss: 0.2004 ||:  23%|##3       | 22/95 [00:15<00:52,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9617, LAS: 0.9238, UEM: 0.6714, LEM: 0.4334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4624, partial_loss/deprel_loss: 0.4234, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6316, loss: 0.5981, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||:  28%|##8       | 27/95 [00:17<00:43,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9605, LAS: 0.9225, UEM: 0.6491, LEM: 0.4075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3813, partial_loss/deprel_loss: 0.4035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5994, loss: 0.6075, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||:  34%|###3      | 32/95 [00:20<00:37,  1.66it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9600, LAS: 0.9222, UEM: 0.6444, LEM: 0.4011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2141, partial_loss/deprel_loss: 0.3387, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.6112, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||:  39%|###8      | 37/95 [00:22<00:32,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9600, LAS: 0.9222, UEM: 0.6411, LEM: 0.3976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2529, partial_loss/deprel_loss: 0.3846, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5585, loss: 0.6134, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||:  44%|####4     | 42/95 [00:25<00:28,  1.85it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9594, LAS: 0.9214, UEM: 0.6397, LEM: 0.3973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8439, partial_loss/deprel_loss: 0.5619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8186, loss: 0.6150, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||:  48%|####8     | 46/95 [00:28<00:29,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9606, LAS: 0.9228, UEM: 0.6704, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3845, partial_loss/deprel_loss: 0.4122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6069, loss: 0.6046, batch_reg_loss: 0.2003, reg_loss: 0.2004 ||:  53%|#####2    | 50/95 [00:31<00:30,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9603, LAS: 0.9223, UEM: 0.6629, LEM: 0.4304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1744, partial_loss/deprel_loss: 0.3334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5018, loss: 0.6073, batch_reg_loss: 0.2002, reg_loss: 0.2004 ||:  57%|#####6    | 54/95 [00:34<00:26,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9609, LAS: 0.9229, UEM: 0.6689, LEM: 0.4349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1728, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4888, loss: 0.6016, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||:  61%|######1   | 58/95 [00:36<00:24,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9605, LAS: 0.9227, UEM: 0.6625, LEM: 0.4276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2980, partial_loss/deprel_loss: 0.3101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5079, loss: 0.6039, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||:  65%|######5   | 62/95 [00:39<00:21,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9603, LAS: 0.9224, UEM: 0.6588, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4922, partial_loss/deprel_loss: 0.5550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7426, loss: 0.6062, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||:  69%|######9   | 66/95 [00:42<00:19,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9606, LAS: 0.9228, UEM: 0.6639, LEM: 0.4287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3517, partial_loss/deprel_loss: 0.4263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6116, loss: 0.6030, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||:  73%|#######2  | 69/95 [00:44<00:18,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9603, LAS: 0.9225, UEM: 0.6559, LEM: 0.4210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6056, partial_loss/deprel_loss: 0.5127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7315, loss: 0.6070, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||:  76%|#######5  | 72/95 [00:46<00:16,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9601, LAS: 0.9222, UEM: 0.6523, LEM: 0.4168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4340, partial_loss/deprel_loss: 0.5110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6958, loss: 0.6086, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||:  79%|#######8  | 75/95 [00:49<00:15,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9603, LAS: 0.9224, UEM: 0.6567, LEM: 0.4222, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1000, partial_loss/deprel_loss: 0.2497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4199, loss: 0.6076, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||:  82%|########2 | 78/95 [00:51<00:12,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9599, LAS: 0.9220, UEM: 0.6516, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2894, partial_loss/deprel_loss: 0.3204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.6095, batch_reg_loss: 0.2002, reg_loss: 0.2003 ||:  86%|########6 | 82/95 [00:53<00:09,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9592, LAS: 0.9214, UEM: 0.6509, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4873, partial_loss/deprel_loss: 0.4518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6590, loss: 0.6129, batch_reg_loss: 0.2001, reg_loss: 0.2003 ||:  89%|########9 | 85/95 [00:56<00:07,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9593, LAS: 0.9216, UEM: 0.6544, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0975, partial_loss/deprel_loss: 0.2299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4035, loss: 0.6113, batch_reg_loss: 0.2001, reg_loss: 0.2003 ||:  93%|#########2| 88/95 [00:58<00:05,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8639, UAS: 0.9585, LAS: 0.9207, UEM: 0.6479, LEM: 0.4169, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1383, partial_loss/deprel_loss: 0.6807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9724, loss: 0.6168, batch_reg_loss: 0.2001, reg_loss: 0.2003 ||:  96%|#########5| 91/95 [01:00<00:02,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9586, LAS: 0.9208, UEM: 0.6522, LEM: 0.4217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9341, partial_loss/deprel_loss: 0.6648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9187, loss: 0.6163, batch_reg_loss: 0.2001, reg_loss: 0.2003 ||:  99%|#########8| 94/95 [01:02<00:00,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9587, LAS: 0.9209, UEM: 0.6532, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2108, partial_loss/deprel_loss: 0.3687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5373, loss: 0.6154, batch_reg_loss: 0.2001, reg_loss: 0.2003 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.200  |       N/A\n",
+      "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - UEM                      |     0.653  |       N/A\n",
+      "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - LEM                      |     0.422  |       N/A\n",
+      "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - EM                       |     0.929  |       N/A\n",
+      "2023-04-07 01:17:42,126 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.211  |       N/A\n",
+      "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
+      "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.369  |       N/A\n",
+      "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - loss                     |     0.615  |       N/A\n",
+      "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - LAS                      |     0.921  |       N/A\n",
+      "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:17:42,127 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:17:42,128 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:17:42,128 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:17:42,128 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:17:42,136 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:17:47,046 - INFO - combo.training.trainer - Epoch duration: 0:01:11.763142\n",
+      "2023-04-07 01:17:47,047 - INFO - combo.training.trainer - Estimated training time remaining: 5:07:45\n",
+      "2023-04-07 01:17:47,047 - INFO - allennlp.training.trainer - Epoch 130/399\n",
+      "2023-04-07 01:17:47,047 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:17:47,047 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:17:47,055 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9790, LAS: 0.9467, UEM: 0.8767, LEM: 0.7108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1059, partial_loss/deprel_loss: 0.2329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4076, loss: 0.4231, batch_reg_loss: 0.2001, reg_loss: 0.2001 ||:   3%|3         | 3/95 [00:02<01:13,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9716, LAS: 0.9350, UEM: 0.7807, LEM: 0.5725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4357, partial_loss/deprel_loss: 0.4884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6780, loss: 0.5086, batch_reg_loss: 0.2001, reg_loss: 0.2001 ||:   7%|7         | 7/95 [00:05<01:07,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9682, LAS: 0.9306, UEM: 0.7316, LEM: 0.5186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4908, partial_loss/deprel_loss: 0.5178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7125, loss: 0.5421, batch_reg_loss: 0.2001, reg_loss: 0.2001 ||:  11%|#         | 10/95 [00:07<01:04,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8696, UAS: 0.9620, LAS: 0.9238, UEM: 0.7156, LEM: 0.5068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2515, partial_loss/deprel_loss: 0.7855, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0787, loss: 0.5891, batch_reg_loss: 0.2001, reg_loss: 0.2001 ||:  14%|#3        | 13/95 [00:09<01:03,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9610, LAS: 0.9234, UEM: 0.6973, LEM: 0.4832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.3414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5205, loss: 0.5968, batch_reg_loss: 0.2001, reg_loss: 0.2001 ||:  17%|#6        | 16/95 [00:11<00:59,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9626, LAS: 0.9249, UEM: 0.6968, LEM: 0.4707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1997, partial_loss/deprel_loss: 0.3292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5034, loss: 0.5830, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||:  20%|##        | 19/95 [00:13<00:55,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9620, LAS: 0.9240, UEM: 0.6781, LEM: 0.4459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5423, partial_loss/deprel_loss: 0.4953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7048, loss: 0.5941, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||:  24%|##4       | 23/95 [00:16<00:50,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9593, LAS: 0.9211, UEM: 0.6633, LEM: 0.4331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3364, partial_loss/deprel_loss: 0.4034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5901, loss: 0.6109, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||:  28%|##8       | 27/95 [00:18<00:45,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9597, LAS: 0.9215, UEM: 0.6719, LEM: 0.4444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5934, partial_loss/deprel_loss: 0.5457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7553, loss: 0.6088, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||:  32%|###1      | 30/95 [00:21<00:46,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9605, LAS: 0.9221, UEM: 0.6805, LEM: 0.4501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5358, partial_loss/deprel_loss: 0.4960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7040, loss: 0.6035, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||:  35%|###4      | 33/95 [00:23<00:43,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9608, LAS: 0.9222, UEM: 0.6809, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6867, partial_loss/deprel_loss: 0.5800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8013, loss: 0.6046, batch_reg_loss: 0.2000, reg_loss: 0.2001 ||:  38%|###7      | 36/95 [00:25<00:41,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9597, LAS: 0.9208, UEM: 0.6796, LEM: 0.4475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6576, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7880, loss: 0.6127, batch_reg_loss: 0.2000, reg_loss: 0.2000 ||:  42%|####2     | 40/95 [00:27<00:35,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9605, LAS: 0.9216, UEM: 0.6810, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3295, partial_loss/deprel_loss: 0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5839, loss: 0.6071, batch_reg_loss: 0.2000, reg_loss: 0.2000 ||:  47%|####7     | 45/95 [00:29<00:29,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9609, LAS: 0.9219, UEM: 0.6751, LEM: 0.4347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2667, partial_loss/deprel_loss: 0.4058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5780, loss: 0.6060, batch_reg_loss: 0.2000, reg_loss: 0.2000 ||:  53%|#####2    | 50/95 [00:31<00:24,  1.87it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9603, LAS: 0.9211, UEM: 0.6737, LEM: 0.4332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4861, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.6114, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||:  57%|#####6    | 54/95 [00:33<00:22,  1.85it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9599, LAS: 0.9210, UEM: 0.6660, LEM: 0.4250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4030, partial_loss/deprel_loss: 0.4400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6325, loss: 0.6132, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||:  61%|######1   | 58/95 [00:36<00:20,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9606, LAS: 0.9218, UEM: 0.6709, LEM: 0.4270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2830, partial_loss/deprel_loss: 0.3800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5605, loss: 0.6065, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||:  65%|######5   | 62/95 [00:39<00:19,  1.68it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9600, LAS: 0.9212, UEM: 0.6656, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2019, partial_loss/deprel_loss: 0.3419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5138, loss: 0.6111, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||:  69%|######9   | 66/95 [00:42<00:19,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9461, UAS: 0.9605, LAS: 0.9219, UEM: 0.6708, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1165, partial_loss/deprel_loss: 0.2782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4457, loss: 0.6058, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||:  74%|#######3  | 70/95 [00:45<00:17,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9596, LAS: 0.9209, UEM: 0.6613, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9136, partial_loss/deprel_loss: 0.5708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8392, loss: 0.6117, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||:  78%|#######7  | 74/95 [00:47<00:13,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9597, LAS: 0.9210, UEM: 0.6599, LEM: 0.4197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2266, partial_loss/deprel_loss: 0.2700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4612, loss: 0.6109, batch_reg_loss: 0.1999, reg_loss: 0.2000 ||:  82%|########2 | 78/95 [00:50<00:11,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9593, LAS: 0.9207, UEM: 0.6565, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6489, partial_loss/deprel_loss: 0.5137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7405, loss: 0.6117, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||:  86%|########6 | 82/95 [00:53<00:09,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9596, LAS: 0.9210, UEM: 0.6572, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3953, partial_loss/deprel_loss: 0.4711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6558, loss: 0.6099, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||:  89%|########9 | 85/95 [00:56<00:07,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9592, LAS: 0.9206, UEM: 0.6511, LEM: 0.4111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3850, partial_loss/deprel_loss: 0.4810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6616, loss: 0.6140, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||:  94%|#########3| 89/95 [00:58<00:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9595, LAS: 0.9209, UEM: 0.6614, LEM: 0.4286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0337, partial_loss/deprel_loss: 0.1437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3215, loss: 0.6122, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||:  97%|#########6| 92/95 [01:00<00:02,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9592, LAS: 0.9206, UEM: 0.6562, LEM: 0.4234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5121, partial_loss/deprel_loss: 0.4671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.6141, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||: 100%|##########| 95/95 [01:03<00:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9592, LAS: 0.9206, UEM: 0.6562, LEM: 0.4234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5121, partial_loss/deprel_loss: 0.4671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.6141, batch_reg_loss: 0.1998, reg_loss: 0.2000 ||: 100%|##########| 95/95 [01:03<00:00,  1.50it/s]\n",
+      "2023-04-07 01:18:53,395 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9522, LAS: 0.9051, UEM: 0.8053, LEM: 0.6314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2243, partial_loss/deprel_loss: 5.3319, partial_loss/cycle_loss: 0.0000, batch_loss: 4.3104, loss: 8.7662, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.09s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8621, UAS: 0.9489, LAS: 0.9015, UEM: 0.7739, LEM: 0.5648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5831, partial_loss/deprel_loss: 21.8201, partial_loss/cycle_loss: 0.0000, batch_loss: 17.7727, loss: 10.0723, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  36%|###6      | 4/11 [00:04<00:07,  1.12s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9504, LAS: 0.9011, UEM: 0.7239, LEM: 0.4769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3935, partial_loss/deprel_loss: 6.7236, partial_loss/cycle_loss: 0.0000, batch_loss: 5.4576, loss: 9.6231, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:07<00:04,  1.08s/it]   \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8802, UAS: 0.9502, LAS: 0.9006, UEM: 0.6871, LEM: 0.4267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0650, partial_loss/deprel_loss: 9.9326, partial_loss/cycle_loss: 0.0000, batch_loss: 8.1591, loss: 9.1834, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:10<00:01,  1.03s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9512, LAS: 0.9009, UEM: 0.6878, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4606, partial_loss/deprel_loss: 8.6600, partial_loss/cycle_loss: 0.0000, batch_loss: 7.0201, loss: 8.9867, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:11<00:00,  1.01s/it]\n",
+      "2023-04-07 01:19:04,558 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:19:04,558 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.200  |     0.000\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - UEM                      |     0.656  |     0.688\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - LEM                      |     0.423  |     0.415\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - EM                       |     0.909  |     0.903\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.512  |     0.461\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |     0.951\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.467  |     8.660\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - loss                     |     0.614  |     8.987\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - LAS                      |     0.921  |     0.901\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:19:04,559 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:19:04,560 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:19:04,560 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:19:04,560 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:19:04,564 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:19:09,248 - INFO - combo.training.trainer - Epoch duration: 0:01:22.200925\n",
+      "2023-04-07 01:19:09,248 - INFO - combo.training.trainer - Estimated training time remaining: 5:07:05\n",
+      "2023-04-07 01:19:09,249 - INFO - allennlp.training.trainer - Epoch 131/399\n",
+      "2023-04-07 01:19:09,249 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:19:09,249 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:19:09,259 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9535, LAS: 0.9158, UEM: 0.5011, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4068, partial_loss/deprel_loss: 0.3856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5897, loss: 0.6570, batch_reg_loss: 0.1998, reg_loss: 0.1998 ||:   4%|4         | 4/95 [00:02<00:55,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9538, LAS: 0.9153, UEM: 0.5257, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4342, partial_loss/deprel_loss: 0.5154, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6989, loss: 0.6594, batch_reg_loss: 0.1998, reg_loss: 0.1998 ||:   8%|8         | 8/95 [00:04<00:52,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9604, LAS: 0.9219, UEM: 0.6755, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1335, partial_loss/deprel_loss: 0.2827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4526, loss: 0.6061, batch_reg_loss: 0.1998, reg_loss: 0.1998 ||:  12%|#1        | 11/95 [00:07<00:56,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9596, LAS: 0.9214, UEM: 0.6476, LEM: 0.4193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4787, partial_loss/deprel_loss: 0.4810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6803, loss: 0.6183, batch_reg_loss: 0.1997, reg_loss: 0.1998 ||:  15%|#4        | 14/95 [00:09<00:55,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9558, LAS: 0.9178, UEM: 0.5973, LEM: 0.3772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9191, partial_loss/deprel_loss: 0.5869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8531, loss: 0.6437, batch_reg_loss: 0.1997, reg_loss: 0.1998 ||:  19%|#8        | 18/95 [00:11<00:50,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9582, LAS: 0.9205, UEM: 0.6412, LEM: 0.4220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1938, partial_loss/deprel_loss: 0.3034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4812, loss: 0.6236, batch_reg_loss: 0.1997, reg_loss: 0.1998 ||:  22%|##2       | 21/95 [00:14<00:51,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9574, LAS: 0.9199, UEM: 0.6314, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6610, partial_loss/deprel_loss: 0.4659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7047, loss: 0.6270, batch_reg_loss: 0.1997, reg_loss: 0.1998 ||:  26%|##6       | 25/95 [00:16<00:47,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9572, LAS: 0.9199, UEM: 0.6175, LEM: 0.3944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5019, partial_loss/deprel_loss: 0.4243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6396, loss: 0.6262, batch_reg_loss: 0.1997, reg_loss: 0.1997 ||:  31%|###       | 29/95 [00:19<00:42,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9579, LAS: 0.9208, UEM: 0.6278, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2056, partial_loss/deprel_loss: 0.3265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5020, loss: 0.6206, batch_reg_loss: 0.1997, reg_loss: 0.1997 ||:  34%|###3      | 32/95 [00:21<00:42,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9596, LAS: 0.9229, UEM: 0.6748, LEM: 0.4611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3569, partial_loss/deprel_loss: 0.4496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6307, loss: 0.6067, batch_reg_loss: 0.1997, reg_loss: 0.1997 ||:  37%|###6      | 35/95 [00:23<00:44,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9596, LAS: 0.9226, UEM: 0.6779, LEM: 0.4595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9298, partial_loss/deprel_loss: 0.5515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8268, loss: 0.6067, batch_reg_loss: 0.1997, reg_loss: 0.1997 ||:  41%|####1     | 39/95 [00:26<00:38,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9594, LAS: 0.9223, UEM: 0.6655, LEM: 0.4429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8453, partial_loss/deprel_loss: 0.5137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7797, loss: 0.6100, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||:  46%|####6     | 44/95 [00:28<00:31,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9581, LAS: 0.9209, UEM: 0.6483, LEM: 0.4262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0519, partial_loss/deprel_loss: 0.5943, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8854, loss: 0.6173, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||:  52%|#####1    | 49/95 [00:30<00:26,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9574, LAS: 0.9203, UEM: 0.6443, LEM: 0.4240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1752, partial_loss/deprel_loss: 0.2790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4578, loss: 0.6196, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||:  56%|#####5    | 53/95 [00:33<00:23,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9578, LAS: 0.9204, UEM: 0.6455, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6243, partial_loss/deprel_loss: 0.5155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7368, loss: 0.6177, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||:  60%|######    | 57/95 [00:35<00:21,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9573, LAS: 0.9199, UEM: 0.6416, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1696, partial_loss/deprel_loss: 0.2771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4552, loss: 0.6219, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||:  64%|######4   | 61/95 [00:38<00:20,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9586, LAS: 0.9211, UEM: 0.6617, LEM: 0.4350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2029, partial_loss/deprel_loss: 0.3563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5252, loss: 0.6137, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||:  68%|######8   | 65/95 [00:41<00:19,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9307, UAS: 0.9583, LAS: 0.9207, UEM: 0.6527, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3263, partial_loss/deprel_loss: 0.3790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5680, loss: 0.6164, batch_reg_loss: 0.1996, reg_loss: 0.1997 ||:  73%|#######2  | 69/95 [00:44<00:17,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9588, LAS: 0.9213, UEM: 0.6577, LEM: 0.4287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2250, partial_loss/deprel_loss: 0.3399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5165, loss: 0.6119, batch_reg_loss: 0.1995, reg_loss: 0.1997 ||:  77%|#######6  | 73/95 [00:47<00:15,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9587, LAS: 0.9211, UEM: 0.6497, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3552, partial_loss/deprel_loss: 0.4067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5960, loss: 0.6139, batch_reg_loss: 0.1995, reg_loss: 0.1997 ||:  81%|########1 | 77/95 [00:49<00:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9590, LAS: 0.9215, UEM: 0.6537, LEM: 0.4244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3266, partial_loss/deprel_loss: 0.3612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.6116, batch_reg_loss: 0.1995, reg_loss: 0.1997 ||:  85%|########5 | 81/95 [00:52<00:09,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9594, LAS: 0.9219, UEM: 0.6617, LEM: 0.4345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2208, partial_loss/deprel_loss: 0.3385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.6079, batch_reg_loss: 0.1995, reg_loss: 0.1997 ||:  88%|########8 | 84/95 [00:54<00:07,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9586, LAS: 0.9211, UEM: 0.6562, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6149, partial_loss/deprel_loss: 0.5757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7831, loss: 0.6144, batch_reg_loss: 0.1995, reg_loss: 0.1996 ||:  92%|#########1| 87/95 [00:56<00:05,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9324, UAS: 0.9590, LAS: 0.9214, UEM: 0.6612, LEM: 0.4330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2563, partial_loss/deprel_loss: 0.4114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5799, loss: 0.6115, batch_reg_loss: 0.1995, reg_loss: 0.1996 ||:  95%|#########4| 90/95 [00:59<00:03,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9591, LAS: 0.9216, UEM: 0.6571, LEM: 0.4274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3742, partial_loss/deprel_loss: 0.3562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5592, loss: 0.6103, batch_reg_loss: 0.1995, reg_loss: 0.1996 ||:  99%|#########8| 94/95 [01:01<00:00,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9591, LAS: 0.9216, UEM: 0.6561, LEM: 0.4257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3952, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6228, loss: 0.6104, batch_reg_loss: 0.1995, reg_loss: 0.1996 ||: 100%|##########| 95/95 [01:02<00:00,  1.52it/s]\n",
+      "2023-04-07 01:20:14,786 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:20:14,786 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:20:14,786 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.200  |       N/A\n",
+      "2023-04-07 01:20:14,786 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - UEM                      |     0.656  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - LEM                      |     0.426  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - EM                       |     0.920  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.395  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.430  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - loss                     |     0.610  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:20:14,787 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:20:14,792 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:20:19,595 - INFO - combo.training.trainer - Epoch duration: 0:01:10.346127\n",
+      "2023-04-07 01:20:19,595 - INFO - combo.training.trainer - Estimated training time remaining: 5:06:00\n",
+      "2023-04-07 01:20:19,595 - INFO - allennlp.training.trainer - Epoch 132/399\n",
+      "2023-04-07 01:20:19,596 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:20:19,596 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:20:19,606 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9726, LAS: 0.9355, UEM: 0.7834, LEM: 0.5588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1801, partial_loss/deprel_loss: 0.3268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4969, loss: 0.5050, batch_reg_loss: 0.1995, reg_loss: 0.1995 ||:   3%|3         | 3/95 [00:02<01:15,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9665, LAS: 0.9290, UEM: 0.6954, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2625, partial_loss/deprel_loss: 0.3557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5365, loss: 0.5598, batch_reg_loss: 0.1994, reg_loss: 0.1995 ||:   6%|6         | 6/95 [00:04<01:11,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9568, LAS: 0.9192, UEM: 0.6097, LEM: 0.3903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6579, partial_loss/deprel_loss: 0.5388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7621, loss: 0.6298, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||:   9%|9         | 9/95 [00:06<01:06,  1.30it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9581, LAS: 0.9204, UEM: 0.6453, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1791, partial_loss/deprel_loss: 0.3220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4929, loss: 0.6212, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||:  13%|#2        | 12/95 [00:09<01:02,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9562, LAS: 0.9191, UEM: 0.5933, LEM: 0.3655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5175, partial_loss/deprel_loss: 0.4918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6963, loss: 0.6354, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||:  17%|#6        | 16/95 [00:11<00:57,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9586, LAS: 0.9215, UEM: 0.6436, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1133, partial_loss/deprel_loss: 0.2584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4288, loss: 0.6159, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||:  20%|##        | 19/95 [00:14<00:59,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9360, UAS: 0.9598, LAS: 0.9227, UEM: 0.6414, LEM: 0.4065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2147, partial_loss/deprel_loss: 0.3550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5263, loss: 0.6056, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||:  23%|##3       | 22/95 [00:16<00:55,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9595, LAS: 0.9226, UEM: 0.6297, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3931, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5889, loss: 0.6056, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||:  26%|##6       | 25/95 [00:18<00:53,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9583, LAS: 0.9213, UEM: 0.6171, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7926, partial_loss/deprel_loss: 0.5822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8236, loss: 0.6173, batch_reg_loss: 0.1994, reg_loss: 0.1994 ||:  29%|##9       | 28/95 [00:21<00:50,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9583, LAS: 0.9213, UEM: 0.6311, LEM: 0.3954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9408, partial_loss/deprel_loss: 0.5951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8636, loss: 0.6161, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||:  33%|###2      | 31/95 [00:23<00:48,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9578, LAS: 0.9207, UEM: 0.6404, LEM: 0.4068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.2774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4528, loss: 0.6182, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||:  36%|###5      | 34/95 [00:25<00:46,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9574, LAS: 0.9199, UEM: 0.6286, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4544, partial_loss/deprel_loss: 0.4705, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6666, loss: 0.6246, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||:  40%|####      | 38/95 [00:28<00:40,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9572, LAS: 0.9197, UEM: 0.6213, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4091, partial_loss/deprel_loss: 0.4012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6020, loss: 0.6266, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||:  43%|####3     | 41/95 [00:30<00:38,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9579, LAS: 0.9202, UEM: 0.6249, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1761, partial_loss/deprel_loss: 0.3662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5274, loss: 0.6225, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||:  46%|####6     | 44/95 [00:32<00:37,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9579, LAS: 0.9203, UEM: 0.6215, LEM: 0.3804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8664, partial_loss/deprel_loss: 0.6563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8976, loss: 0.6244, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||:  51%|#####     | 48/95 [00:35<00:33,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9576, LAS: 0.9199, UEM: 0.6289, LEM: 0.3925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1261, partial_loss/deprel_loss: 0.2248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4043, loss: 0.6267, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||:  54%|#####3    | 51/95 [00:37<00:31,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9582, LAS: 0.9207, UEM: 0.6301, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5878, partial_loss/deprel_loss: 0.4516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6781, loss: 0.6213, batch_reg_loss: 0.1993, reg_loss: 0.1994 ||:  59%|#####8    | 56/95 [00:39<00:25,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9578, LAS: 0.9204, UEM: 0.6178, LEM: 0.3806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4879, partial_loss/deprel_loss: 0.4643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6683, loss: 0.6228, batch_reg_loss: 0.1993, reg_loss: 0.1993 ||:  64%|######4   | 61/95 [00:42<00:20,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9581, LAS: 0.9205, UEM: 0.6223, LEM: 0.3820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6060, partial_loss/deprel_loss: 0.4639, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6916, loss: 0.6196, batch_reg_loss: 0.1992, reg_loss: 0.1993 ||:  68%|######8   | 65/95 [00:44<00:18,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9372, UAS: 0.9579, LAS: 0.9202, UEM: 0.6264, LEM: 0.3853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1883, partial_loss/deprel_loss: 0.3032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4794, loss: 0.6218, batch_reg_loss: 0.1992, reg_loss: 0.1993 ||:  73%|#######2  | 69/95 [00:47<00:15,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9579, LAS: 0.9200, UEM: 0.6206, LEM: 0.3791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4641, partial_loss/deprel_loss: 0.4905, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6844, loss: 0.6241, batch_reg_loss: 0.1992, reg_loss: 0.1993 ||:  77%|#######6  | 73/95 [00:49<00:13,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9578, LAS: 0.9199, UEM: 0.6231, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1604, partial_loss/deprel_loss: 0.3210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.6250, batch_reg_loss: 0.1992, reg_loss: 0.1993 ||:  81%|########1 | 77/95 [00:51<00:10,  1.69it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9585, LAS: 0.9208, UEM: 0.6421, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.2897, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4708, loss: 0.6171, batch_reg_loss: 0.1992, reg_loss: 0.1993 ||:  85%|########5 | 81/95 [00:54<00:08,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9587, LAS: 0.9212, UEM: 0.6542, LEM: 0.4252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7923, partial_loss/deprel_loss: 0.5080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7641, loss: 0.6143, batch_reg_loss: 0.1992, reg_loss: 0.1993 ||:  89%|########9 | 85/95 [00:56<00:06,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9590, LAS: 0.9216, UEM: 0.6569, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2455, partial_loss/deprel_loss: 0.3351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5163, loss: 0.6113, batch_reg_loss: 0.1991, reg_loss: 0.1993 ||:  95%|#########4| 90/95 [00:59<00:02,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9591, LAS: 0.9216, UEM: 0.6544, LEM: 0.4242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5435, partial_loss/deprel_loss: 0.4717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6852, loss: 0.6107, batch_reg_loss: 0.1991, reg_loss: 0.1993 ||:  99%|#########8| 94/95 [01:01<00:00,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9593, LAS: 0.9218, UEM: 0.6573, LEM: 0.4266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1718, partial_loss/deprel_loss: 0.2827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4596, loss: 0.6091, batch_reg_loss: 0.1991, reg_loss: 0.1993 ||: 100%|##########| 95/95 [01:02<00:00,  1.52it/s]\n",
+      "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.199  |       N/A\n",
+      "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - UEM                      |     0.657  |       N/A\n",
+      "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - LEM                      |     0.427  |       N/A\n",
+      "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - EM                       |     0.941  |       N/A\n",
+      "2023-04-07 01:21:24,923 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.172  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.283  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - loss                     |     0.609  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:21:24,924 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:21:24,929 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:21:29,084 - INFO - combo.training.trainer - Epoch duration: 0:01:09.488866\n",
+      "2023-04-07 01:21:29,085 - INFO - combo.training.trainer - Estimated training time remaining: 5:04:54\n",
+      "2023-04-07 01:21:29,085 - INFO - allennlp.training.trainer - Epoch 133/399\n",
+      "2023-04-07 01:21:29,085 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:21:29,086 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:21:29,093 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9399, LAS: 0.9028, UEM: 0.2065, LEM: 0.0769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5936, partial_loss/deprel_loss: 0.5406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7503, loss: 0.7376, batch_reg_loss: 0.1991, reg_loss: 0.1991 ||:   3%|3         | 3/95 [00:02<01:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9539, LAS: 0.9176, UEM: 0.5125, LEM: 0.2943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2040, partial_loss/deprel_loss: 0.3429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5142, loss: 0.6439, batch_reg_loss: 0.1991, reg_loss: 0.1991 ||:   7%|7         | 7/95 [00:04<00:59,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9564, LAS: 0.9197, UEM: 0.5869, LEM: 0.3630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1730, partial_loss/deprel_loss: 0.2958, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4703, loss: 0.6288, batch_reg_loss: 0.1991, reg_loss: 0.1991 ||:  11%|#         | 10/95 [00:06<00:57,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9559, LAS: 0.9192, UEM: 0.5592, LEM: 0.3337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3661, partial_loss/deprel_loss: 0.4280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.6349, batch_reg_loss: 0.1991, reg_loss: 0.1991 ||:  15%|#4        | 14/95 [00:09<00:54,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9564, LAS: 0.9201, UEM: 0.5590, LEM: 0.3300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5096, partial_loss/deprel_loss: 0.4017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6224, loss: 0.6229, batch_reg_loss: 0.1991, reg_loss: 0.1991 ||:  18%|#7        | 17/95 [00:11<00:52,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9589, LAS: 0.9226, UEM: 0.5985, LEM: 0.3627, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2027, partial_loss/deprel_loss: 0.2514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4407, loss: 0.6044, batch_reg_loss: 0.1990, reg_loss: 0.1991 ||:  22%|##2       | 21/95 [00:13<00:47,  1.55it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9576, LAS: 0.9207, UEM: 0.6014, LEM: 0.3598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3723, partial_loss/deprel_loss: 0.4805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6579, loss: 0.6190, batch_reg_loss: 0.1990, reg_loss: 0.1991 ||:  25%|##5       | 24/95 [00:15<00:46,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9574, LAS: 0.9211, UEM: 0.5883, LEM: 0.3519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3182, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5365, loss: 0.6163, batch_reg_loss: 0.1990, reg_loss: 0.1991 ||:  28%|##8       | 27/95 [00:17<00:45,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9577, LAS: 0.9216, UEM: 0.5975, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1524, partial_loss/deprel_loss: 0.3113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4785, loss: 0.6115, batch_reg_loss: 0.1990, reg_loss: 0.1991 ||:  33%|###2      | 31/95 [00:20<00:43,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9586, LAS: 0.9224, UEM: 0.6095, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1509, partial_loss/deprel_loss: 0.2543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4326, loss: 0.6066, batch_reg_loss: 0.1990, reg_loss: 0.1991 ||:  36%|###5      | 34/95 [00:22<00:42,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9574, LAS: 0.9210, UEM: 0.5948, LEM: 0.3568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6901, partial_loss/deprel_loss: 0.5410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7698, loss: 0.6148, batch_reg_loss: 0.1990, reg_loss: 0.1990 ||:  39%|###8      | 37/95 [00:25<00:40,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9583, LAS: 0.9223, UEM: 0.6306, LEM: 0.4103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3606, partial_loss/deprel_loss: 0.3141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5224, loss: 0.6058, batch_reg_loss: 0.1990, reg_loss: 0.1990 ||:  42%|####2     | 40/95 [00:27<00:41,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9590, LAS: 0.9227, UEM: 0.6295, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3459, partial_loss/deprel_loss: 0.4359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6169, loss: 0.6030, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||:  46%|####6     | 44/95 [00:30<00:36,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9228, UEM: 0.6317, LEM: 0.4045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3376, partial_loss/deprel_loss: 0.4140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5977, loss: 0.6015, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||:  49%|####9     | 47/95 [00:32<00:33,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9593, LAS: 0.9229, UEM: 0.6357, LEM: 0.4080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6555, partial_loss/deprel_loss: 0.5572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7758, loss: 0.6008, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||:  53%|#####2    | 50/95 [00:34<00:32,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9585, LAS: 0.9220, UEM: 0.6241, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6961, partial_loss/deprel_loss: 0.5424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7720, loss: 0.6065, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||:  56%|#####5    | 53/95 [00:36<00:31,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9579, LAS: 0.9214, UEM: 0.6182, LEM: 0.3921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8112, partial_loss/deprel_loss: 0.5747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8209, loss: 0.6116, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||:  59%|#####8    | 56/95 [00:39<00:29,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9569, LAS: 0.9204, UEM: 0.6100, LEM: 0.3846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5175, partial_loss/deprel_loss: 0.4520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6640, loss: 0.6181, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||:  62%|######2   | 59/95 [00:41<00:26,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9569, LAS: 0.9203, UEM: 0.6064, LEM: 0.3807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6156, partial_loss/deprel_loss: 0.5473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7598, loss: 0.6195, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||:  65%|######5   | 62/95 [00:43<00:25,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9579, LAS: 0.9213, UEM: 0.6329, LEM: 0.4109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0794, partial_loss/deprel_loss: 0.1908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3673, loss: 0.6108, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||:  68%|######8   | 65/95 [00:46<00:23,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9577, LAS: 0.9212, UEM: 0.6300, LEM: 0.4073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3188, partial_loss/deprel_loss: 0.3842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5700, loss: 0.6126, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||:  72%|#######1  | 68/95 [00:48<00:21,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9580, LAS: 0.9214, UEM: 0.6344, LEM: 0.4107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4566, partial_loss/deprel_loss: 0.4366, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6395, loss: 0.6101, batch_reg_loss: 0.1989, reg_loss: 0.1990 ||:  75%|#######4  | 71/95 [00:50<00:17,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9579, LAS: 0.9212, UEM: 0.6278, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2838, partial_loss/deprel_loss: 0.3759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5563, loss: 0.6125, batch_reg_loss: 0.1988, reg_loss: 0.1990 ||:  79%|#######8  | 75/95 [00:53<00:14,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9580, LAS: 0.9211, UEM: 0.6389, LEM: 0.4142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0798, partial_loss/deprel_loss: 0.2407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4073, loss: 0.6137, batch_reg_loss: 0.1988, reg_loss: 0.1990 ||:  82%|########2 | 78/95 [00:55<00:12,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9574, LAS: 0.9206, UEM: 0.6413, LEM: 0.4196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9004, partial_loss/deprel_loss: 0.6443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8944, loss: 0.6174, batch_reg_loss: 0.1988, reg_loss: 0.1990 ||:  85%|########5 | 81/95 [00:57<00:10,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9580, LAS: 0.9210, UEM: 0.6499, LEM: 0.4262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2265, partial_loss/deprel_loss: 0.3796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5478, loss: 0.6142, batch_reg_loss: 0.1988, reg_loss: 0.1990 ||:  89%|########9 | 85/95 [00:59<00:06,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9586, LAS: 0.9217, UEM: 0.6566, LEM: 0.4312, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1234, partial_loss/deprel_loss: 0.2830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.6101, batch_reg_loss: 0.1988, reg_loss: 0.1989 ||:  94%|#########3| 89/95 [01:02<00:04,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9588, LAS: 0.9217, UEM: 0.6545, LEM: 0.4263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2995, partial_loss/deprel_loss: 0.3699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5546, loss: 0.6094, batch_reg_loss: 0.1988, reg_loss: 0.1989 ||:  98%|#########7| 93/95 [01:05<00:01,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9591, LAS: 0.9221, UEM: 0.6580, LEM: 0.4287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2678, partial_loss/deprel_loss: 0.3305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5167, loss: 0.6070, batch_reg_loss: 0.1988, reg_loss: 0.1989 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.199  |       N/A\n",
+      "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - UEM                      |     0.658  |       N/A\n",
+      "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - LEM                      |     0.429  |       N/A\n",
+      "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - EM                       |     0.934  |       N/A\n",
+      "2023-04-07 01:22:38,758 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.268  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.330  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - loss                     |     0.607  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,759 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,764 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:22:45,622 - INFO - combo.training.trainer - Epoch duration: 0:01:16.537262\n",
+      "2023-04-07 01:22:45,623 - INFO - combo.training.trainer - Estimated training time remaining: 5:04:01\n",
+      "2023-04-07 01:22:45,623 - INFO - allennlp.training.trainer - Epoch 134/399\n",
+      "2023-04-07 01:22:45,623 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:22:45,624 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:22:45,633 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9587, LAS: 0.9216, UEM: 0.5794, LEM: 0.3084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2872, partial_loss/deprel_loss: 0.3748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.6184, batch_reg_loss: 0.1988, reg_loss: 0.1988 ||:   4%|4         | 4/95 [00:02<00:55,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9627, LAS: 0.9254, UEM: 0.6145, LEM: 0.3311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3075, partial_loss/deprel_loss: 0.3267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5216, loss: 0.5816, batch_reg_loss: 0.1987, reg_loss: 0.1988 ||:   7%|7         | 7/95 [00:04<00:55,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9634, LAS: 0.9266, UEM: 0.6209, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2019, partial_loss/deprel_loss: 0.2582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4457, loss: 0.5769, batch_reg_loss: 0.1987, reg_loss: 0.1988 ||:  12%|#1        | 11/95 [00:06<00:52,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9480, UAS: 0.9658, LAS: 0.9284, UEM: 0.6867, LEM: 0.4317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0975, partial_loss/deprel_loss: 0.2502, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4184, loss: 0.5614, batch_reg_loss: 0.1987, reg_loss: 0.1987 ||:  16%|#5        | 15/95 [00:09<00:52,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9657, LAS: 0.9285, UEM: 0.6866, LEM: 0.4276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1655, partial_loss/deprel_loss: 0.3317, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.5615, batch_reg_loss: 0.1987, reg_loss: 0.1987 ||:  20%|##        | 19/95 [00:12<00:48,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9659, LAS: 0.9286, UEM: 0.6879, LEM: 0.4316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4217, partial_loss/deprel_loss: 0.4791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.5634, batch_reg_loss: 0.1987, reg_loss: 0.1987 ||:  23%|##3       | 22/95 [00:14<00:48,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9638, LAS: 0.9263, UEM: 0.6769, LEM: 0.4218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3697, partial_loss/deprel_loss: 0.4395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6242, loss: 0.5777, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||:  26%|##6       | 25/95 [00:16<00:47,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9532, UAS: 0.9637, LAS: 0.9269, UEM: 0.6751, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1453, partial_loss/deprel_loss: 0.2524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4296, loss: 0.5786, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||:  29%|##9       | 28/95 [00:18<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9634, LAS: 0.9266, UEM: 0.6617, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5527, partial_loss/deprel_loss: 0.5190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7243, loss: 0.5815, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||:  34%|###3      | 32/95 [00:21<00:42,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9643, LAS: 0.9273, UEM: 0.6860, LEM: 0.4334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1710, partial_loss/deprel_loss: 0.2952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4690, loss: 0.5732, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||:  37%|###6      | 35/95 [00:23<00:41,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9637, LAS: 0.9265, UEM: 0.6841, LEM: 0.4343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7499, partial_loss/deprel_loss: 0.6065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8338, loss: 0.5772, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||:  40%|####      | 38/95 [00:25<00:41,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9640, LAS: 0.9269, UEM: 0.6920, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5653, partial_loss/deprel_loss: 0.5201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7277, loss: 0.5742, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||:  43%|####3     | 41/95 [00:28<00:41,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9645, LAS: 0.9272, UEM: 0.6925, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2804, partial_loss/deprel_loss: 0.3900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5666, loss: 0.5728, batch_reg_loss: 0.1986, reg_loss: 0.1987 ||:  46%|####6     | 44/95 [00:30<00:38,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9633, LAS: 0.9257, UEM: 0.6906, LEM: 0.4415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3622, partial_loss/deprel_loss: 0.4119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6005, loss: 0.5807, batch_reg_loss: 0.1985, reg_loss: 0.1987 ||:  49%|####9     | 47/95 [00:32<00:36,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9372, UAS: 0.9629, LAS: 0.9254, UEM: 0.6836, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2095, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5069, loss: 0.5827, batch_reg_loss: 0.1985, reg_loss: 0.1986 ||:  54%|#####3    | 51/95 [00:35<00:32,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9625, LAS: 0.9251, UEM: 0.6921, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2024, partial_loss/deprel_loss: 0.3444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.5865, batch_reg_loss: 0.1985, reg_loss: 0.1986 ||:  58%|#####7    | 55/95 [00:38<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9626, LAS: 0.9250, UEM: 0.6952, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1205, partial_loss/deprel_loss: 0.2485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4214, loss: 0.5862, batch_reg_loss: 0.1985, reg_loss: 0.1986 ||:  61%|######1   | 58/95 [00:40<00:27,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9629, LAS: 0.9255, UEM: 0.6956, LEM: 0.4535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3908, partial_loss/deprel_loss: 0.4097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.5823, batch_reg_loss: 0.1985, reg_loss: 0.1986 ||:  65%|######5   | 62/95 [00:43<00:23,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9629, LAS: 0.9255, UEM: 0.6915, LEM: 0.4492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3678, partial_loss/deprel_loss: 0.4048, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.5824, batch_reg_loss: 0.1985, reg_loss: 0.1986 ||:  68%|######8   | 65/95 [00:45<00:22,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9628, LAS: 0.9254, UEM: 0.6897, LEM: 0.4478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1705, partial_loss/deprel_loss: 0.2590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4397, loss: 0.5825, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||:  72%|#######1  | 68/95 [00:48<00:20,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9617, LAS: 0.9244, UEM: 0.6812, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8721, partial_loss/deprel_loss: 0.5912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8458, loss: 0.5900, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||:  75%|#######4  | 71/95 [00:50<00:17,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9611, LAS: 0.9238, UEM: 0.6721, LEM: 0.4339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7259, partial_loss/deprel_loss: 0.5685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7984, loss: 0.5945, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||:  78%|#######7  | 74/95 [00:52<00:15,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9605, LAS: 0.9232, UEM: 0.6652, LEM: 0.4278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6742, partial_loss/deprel_loss: 0.5349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7612, loss: 0.5999, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||:  81%|########1 | 77/95 [00:54<00:12,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8480, UAS: 0.9597, LAS: 0.9227, UEM: 0.6757, LEM: 0.4480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4574, partial_loss/deprel_loss: 0.7380, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0803, loss: 0.6039, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||:  84%|########4 | 80/95 [00:56<00:11,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9594, LAS: 0.9223, UEM: 0.6720, LEM: 0.4427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3185, partial_loss/deprel_loss: 0.4009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5828, loss: 0.6069, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||:  87%|########7 | 83/95 [00:59<00:09,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9592, LAS: 0.9219, UEM: 0.6638, LEM: 0.4343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5500, partial_loss/deprel_loss: 0.5016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7097, loss: 0.6094, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||:  92%|#########1| 87/95 [01:01<00:05,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9592, LAS: 0.9218, UEM: 0.6602, LEM: 0.4297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2254, partial_loss/deprel_loss: 0.3015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4847, loss: 0.6093, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||:  96%|#########5| 91/95 [01:03<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9596, LAS: 0.9221, UEM: 0.6595, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2163, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5255, loss: 0.6066, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 100%|##########| 95/95 [01:06<00:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9596, LAS: 0.9221, UEM: 0.6595, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2163, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5255, loss: 0.6066, batch_reg_loss: 0.1984, reg_loss: 0.1986 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.199  |       N/A\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - UEM                      |     0.660  |       N/A\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - LEM                      |     0.427  |       N/A\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - EM                       |     0.934  |       N/A\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.216  |       N/A\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:23:55,488 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
+      "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.355  |       N/A\n",
+      "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - loss                     |     0.607  |       N/A\n",
+      "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |       N/A\n",
+      "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:23:55,489 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:23:55,494 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:24:00,913 - INFO - combo.training.trainer - Epoch duration: 0:01:15.289828\n",
+      "2023-04-07 01:24:00,913 - INFO - combo.training.trainer - Estimated training time remaining: 5:03:06\n",
+      "2023-04-07 01:24:00,913 - INFO - allennlp.training.trainer - Epoch 135/399\n",
+      "2023-04-07 01:24:00,913 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:24:00,914 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:24:00,924 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9734, LAS: 0.9385, UEM: 0.8424, LEM: 0.6630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5135, partial_loss/deprel_loss: 0.5183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7157, loss: 0.4844, batch_reg_loss: 0.1984, reg_loss: 0.1984 ||:   4%|4         | 4/95 [00:02<00:47,  1.92it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9621, LAS: 0.9262, UEM: 0.7501, LEM: 0.5557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2303, partial_loss/deprel_loss: 0.3211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5013, loss: 0.5787, batch_reg_loss: 0.1984, reg_loss: 0.1984 ||:   9%|9         | 9/95 [00:04<00:43,  1.99it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9640, LAS: 0.9268, UEM: 0.7403, LEM: 0.5221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3602, partial_loss/deprel_loss: 0.3763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5714, loss: 0.5684, batch_reg_loss: 0.1984, reg_loss: 0.1984 ||:  15%|#4        | 14/95 [00:06<00:39,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9642, LAS: 0.9273, UEM: 0.7454, LEM: 0.5255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8161, partial_loss/deprel_loss: 0.5156, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7740, loss: 0.5649, batch_reg_loss: 0.1983, reg_loss: 0.1984 ||:  19%|#8        | 18/95 [00:08<00:39,  1.94it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9608, LAS: 0.9236, UEM: 0.7243, LEM: 0.5029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3672, partial_loss/deprel_loss: 0.3806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5763, loss: 0.5923, batch_reg_loss: 0.1983, reg_loss: 0.1984 ||:  23%|##3       | 22/95 [00:11<00:41,  1.77it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9598, LAS: 0.9227, UEM: 0.7079, LEM: 0.4870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7618, partial_loss/deprel_loss: 0.5350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7786, loss: 0.5970, batch_reg_loss: 0.1983, reg_loss: 0.1984 ||:  27%|##7       | 26/95 [00:14<00:40,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9609, LAS: 0.9239, UEM: 0.7030, LEM: 0.4766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2092, partial_loss/deprel_loss: 0.3251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.5888, batch_reg_loss: 0.1983, reg_loss: 0.1983 ||:  32%|###1      | 30/95 [00:17<00:40,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9599, LAS: 0.9229, UEM: 0.6832, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6985, partial_loss/deprel_loss: 0.5348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7658, loss: 0.5973, batch_reg_loss: 0.1983, reg_loss: 0.1983 ||:  36%|###5      | 34/95 [00:19<00:37,  1.65it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9603, LAS: 0.9235, UEM: 0.6796, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3702, partial_loss/deprel_loss: 0.3774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5742, loss: 0.5939, batch_reg_loss: 0.1983, reg_loss: 0.1983 ||:  40%|####      | 38/95 [00:21<00:34,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9244, UAS: 0.9588, LAS: 0.9218, UEM: 0.6668, LEM: 0.4372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3178, partial_loss/deprel_loss: 0.4070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.6046, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||:  44%|####4     | 42/95 [00:24<00:32,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9588, LAS: 0.9219, UEM: 0.6636, LEM: 0.4352, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0991, partial_loss/deprel_loss: 0.2442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4134, loss: 0.6069, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||:  48%|####8     | 46/95 [00:26<00:30,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9595, LAS: 0.9228, UEM: 0.6722, LEM: 0.4442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1898, partial_loss/deprel_loss: 0.3519, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5177, loss: 0.6017, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||:  53%|#####2    | 50/95 [00:30<00:30,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9598, LAS: 0.9230, UEM: 0.6752, LEM: 0.4476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1546, partial_loss/deprel_loss: 0.2717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4465, loss: 0.6022, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||:  56%|#####5    | 53/95 [00:32<00:29,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9602, LAS: 0.9234, UEM: 0.6769, LEM: 0.4479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4765, partial_loss/deprel_loss: 0.4579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.6002, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||:  59%|#####8    | 56/95 [00:34<00:26,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9599, LAS: 0.9233, UEM: 0.6675, LEM: 0.4390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5892, partial_loss/deprel_loss: 0.4697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6918, loss: 0.6008, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||:  63%|######3   | 60/95 [00:36<00:23,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9588, LAS: 0.9221, UEM: 0.6554, LEM: 0.4282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6334, partial_loss/deprel_loss: 0.5019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7264, loss: 0.6090, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||:  67%|######7   | 64/95 [00:39<00:21,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9593, LAS: 0.9229, UEM: 0.6709, LEM: 0.4527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5367, partial_loss/deprel_loss: 0.4702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6817, loss: 0.6044, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||:  71%|#######   | 67/95 [00:42<00:20,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8981, UAS: 0.9592, LAS: 0.9228, UEM: 0.6741, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6735, partial_loss/deprel_loss: 0.5313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7579, loss: 0.6047, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||:  74%|#######3  | 70/95 [00:44<00:19,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9593, LAS: 0.9228, UEM: 0.6713, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2803, partial_loss/deprel_loss: 0.3732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5528, loss: 0.6042, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||:  77%|#######6  | 73/95 [00:46<00:16,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9588, LAS: 0.9222, UEM: 0.6636, LEM: 0.4448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2255, partial_loss/deprel_loss: 0.3710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5401, loss: 0.6087, batch_reg_loss: 0.1982, reg_loss: 0.1983 ||:  81%|########1 | 77/95 [00:49<00:12,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9591, LAS: 0.9224, UEM: 0.6621, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2382, partial_loss/deprel_loss: 0.3699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5417, loss: 0.6078, batch_reg_loss: 0.1981, reg_loss: 0.1983 ||:  84%|########4 | 80/95 [00:51<00:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9592, LAS: 0.9225, UEM: 0.6615, LEM: 0.4401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4661, partial_loss/deprel_loss: 0.4844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6789, loss: 0.6062, batch_reg_loss: 0.1981, reg_loss: 0.1983 ||:  87%|########7 | 83/95 [00:53<00:08,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9591, LAS: 0.9224, UEM: 0.6554, LEM: 0.4328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3490, partial_loss/deprel_loss: 0.4178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6021, loss: 0.6071, batch_reg_loss: 0.1981, reg_loss: 0.1983 ||:  92%|#########1| 87/95 [00:55<00:05,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9164, UAS: 0.9593, LAS: 0.9226, UEM: 0.6519, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4279, partial_loss/deprel_loss: 0.4535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6465, loss: 0.6058, batch_reg_loss: 0.1981, reg_loss: 0.1982 ||:  96%|#########5| 91/95 [00:58<00:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9596, LAS: 0.9228, UEM: 0.6544, LEM: 0.4292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3878, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6518, loss: 0.6035, batch_reg_loss: 0.1981, reg_loss: 0.1982 ||:  99%|#########8| 94/95 [01:00<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9596, LAS: 0.9229, UEM: 0.6572, LEM: 0.4325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2029, partial_loss/deprel_loss: 0.2692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4540, loss: 0.6019, batch_reg_loss: 0.1981, reg_loss: 0.1982 ||: 100%|##########| 95/95 [01:01<00:00,  1.54it/s]\n",
+      "2023-04-07 01:25:05,849 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8570, UAS: 0.9448, LAS: 0.8910, UEM: 0.5697, LEM: 0.3105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5015, partial_loss/deprel_loss: 20.5917, partial_loss/cycle_loss: 0.0000, batch_loss: 16.7736, loss: 10.3735, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:03<00:08,  1.06s/it]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9466, LAS: 0.8907, UEM: 0.5723, LEM: 0.2552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6183, partial_loss/deprel_loss: 7.5705, partial_loss/cycle_loss: 0.0000, batch_loss: 6.1801, loss: 9.4382, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  55%|#####4    | 6/11 [00:05<00:05,  1.01s/it]   \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8838, UAS: 0.9465, LAS: 0.8924, UEM: 0.5659, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9658, partial_loss/deprel_loss: 9.7527, partial_loss/cycle_loss: 0.0000, batch_loss: 7.9953, loss: 9.4572, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  82%|########1 | 9/11 [00:08<00:01,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9518, LAS: 0.9006, UEM: 0.6898, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2077, partial_loss/deprel_loss: 5.1934, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1963, loss: 8.5575, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.03s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9518, LAS: 0.9006, UEM: 0.6898, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2077, partial_loss/deprel_loss: 5.1934, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1963, loss: 8.5575, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.01it/s]\n",
+      "2023-04-07 01:25:16,783 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:25:16,783 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:25:16,783 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.198  |     0.000\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - UEM                      |     0.657  |     0.690\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - LEM                      |     0.433  |     0.415\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - EM                       |     0.933  |     0.944\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.203  |     0.208\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |     0.952\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.269  |     5.193\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - loss                     |     0.602  |     8.557\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - LAS                      |     0.923  |     0.901\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:25:16,784 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:25:16,785 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:25:16,785 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:25:16,789 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:25:21,507 - INFO - combo.training.trainer - Epoch duration: 0:01:20.593771\n",
+      "2023-04-07 01:25:21,508 - INFO - combo.training.trainer - Estimated training time remaining: 5:02:20\n",
+      "2023-04-07 01:25:21,508 - INFO - allennlp.training.trainer - Epoch 136/399\n",
+      "2023-04-07 01:25:21,508 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:25:21,508 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:25:21,519 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9477, LAS: 0.9105, UEM: 0.4170, LEM: 0.1993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2722, partial_loss/deprel_loss: 0.3794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.6688, batch_reg_loss: 0.1981, reg_loss: 0.1981 ||:   5%|5         | 5/95 [00:02<00:41,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9572, LAS: 0.9211, UEM: 0.6111, LEM: 0.3729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6145, partial_loss/deprel_loss: 0.5036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7239, loss: 0.6007, batch_reg_loss: 0.1981, reg_loss: 0.1981 ||:  11%|#         | 10/95 [00:04<00:39,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9574, LAS: 0.9199, UEM: 0.6279, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2094, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5212, loss: 0.6057, batch_reg_loss: 0.1980, reg_loss: 0.1981 ||:  16%|#5        | 15/95 [00:06<00:36,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9589, LAS: 0.9215, UEM: 0.6452, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6473, partial_loss/deprel_loss: 0.4565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.5946, batch_reg_loss: 0.1980, reg_loss: 0.1981 ||:  19%|#8        | 18/95 [00:09<00:42,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9589, LAS: 0.9216, UEM: 0.6381, LEM: 0.3878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5630, partial_loss/deprel_loss: 0.4474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6685, loss: 0.5919, batch_reg_loss: 0.1980, reg_loss: 0.1981 ||:  23%|##3       | 22/95 [00:11<00:42,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9592, LAS: 0.9222, UEM: 0.6422, LEM: 0.3934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2009, partial_loss/deprel_loss: 0.3576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5243, loss: 0.5916, batch_reg_loss: 0.1980, reg_loss: 0.1980 ||:  26%|##6       | 25/95 [00:14<00:44,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9570, LAS: 0.9201, UEM: 0.6178, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4075, partial_loss/deprel_loss: 0.4801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6636, loss: 0.6105, batch_reg_loss: 0.1980, reg_loss: 0.1980 ||:  31%|###       | 29/95 [00:16<00:41,  1.58it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9571, LAS: 0.9201, UEM: 0.6056, LEM: 0.3611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5901, partial_loss/deprel_loss: 0.4912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7090, loss: 0.6146, batch_reg_loss: 0.1980, reg_loss: 0.1980 ||:  34%|###3      | 32/95 [00:18<00:41,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9567, LAS: 0.9198, UEM: 0.6082, LEM: 0.3685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8884, partial_loss/deprel_loss: 0.6101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8637, loss: 0.6163, batch_reg_loss: 0.1980, reg_loss: 0.1980 ||:  37%|###6      | 35/95 [00:20<00:40,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9573, LAS: 0.9206, UEM: 0.6068, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3104, partial_loss/deprel_loss: 0.3744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5596, loss: 0.6127, batch_reg_loss: 0.1980, reg_loss: 0.1980 ||:  40%|####      | 38/95 [00:23<00:40,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9560, UAS: 0.9582, LAS: 0.9216, UEM: 0.6191, LEM: 0.3825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0835, partial_loss/deprel_loss: 0.2134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3854, loss: 0.6083, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||:  44%|####4     | 42/95 [00:26<00:38,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9590, LAS: 0.9223, UEM: 0.6321, LEM: 0.3934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1725, partial_loss/deprel_loss: 0.3023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4743, loss: 0.6025, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||:  47%|####7     | 45/95 [00:28<00:35,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9560, LAS: 0.9194, UEM: 0.6176, LEM: 0.3823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3761, partial_loss/deprel_loss: 0.7035, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0360, loss: 0.6228, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||:  52%|#####1    | 49/95 [00:31<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9568, LAS: 0.9201, UEM: 0.6234, LEM: 0.3862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2165, partial_loss/deprel_loss: 0.3401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5133, loss: 0.6176, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||:  55%|#####4    | 52/95 [00:33<00:30,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8834, UAS: 0.9570, LAS: 0.9205, UEM: 0.6418, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8543, partial_loss/deprel_loss: 0.6344, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8763, loss: 0.6145, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||:  58%|#####7    | 55/95 [00:35<00:28,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9579, LAS: 0.9214, UEM: 0.6563, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2713, partial_loss/deprel_loss: 0.3439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5273, loss: 0.6074, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||:  61%|######1   | 58/95 [00:37<00:27,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9582, LAS: 0.9217, UEM: 0.6544, LEM: 0.4221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4923, partial_loss/deprel_loss: 0.4504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6567, loss: 0.6058, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||:  64%|######4   | 61/95 [00:39<00:24,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9589, LAS: 0.9225, UEM: 0.6632, LEM: 0.4309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1826, partial_loss/deprel_loss: 0.2583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4410, loss: 0.6002, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||:  67%|######7   | 64/95 [00:42<00:23,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9581, LAS: 0.9217, UEM: 0.6515, LEM: 0.4208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7897, partial_loss/deprel_loss: 0.5498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7956, loss: 0.6060, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||:  72%|#######1  | 68/95 [00:44<00:19,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9582, LAS: 0.9218, UEM: 0.6451, LEM: 0.4123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3828, partial_loss/deprel_loss: 0.3718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5718, loss: 0.6069, batch_reg_loss: 0.1979, reg_loss: 0.1980 ||:  76%|#######5  | 72/95 [00:47<00:15,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9585, LAS: 0.9220, UEM: 0.6490, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.3631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5459, loss: 0.6041, batch_reg_loss: 0.1978, reg_loss: 0.1980 ||:  79%|#######8  | 75/95 [00:49<00:14,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9586, LAS: 0.9220, UEM: 0.6448, LEM: 0.4125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1703, partial_loss/deprel_loss: 0.3425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5059, loss: 0.6055, batch_reg_loss: 0.1978, reg_loss: 0.1980 ||:  83%|########3 | 79/95 [00:52<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9589, LAS: 0.9223, UEM: 0.6472, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4874, partial_loss/deprel_loss: 0.4348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6431, loss: 0.6029, batch_reg_loss: 0.1978, reg_loss: 0.1980 ||:  86%|########6 | 82/95 [00:54<00:08,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9589, LAS: 0.9222, UEM: 0.6438, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3174, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5484, loss: 0.6042, batch_reg_loss: 0.1978, reg_loss: 0.1979 ||:  91%|######### | 86/95 [00:57<00:06,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9588, LAS: 0.9222, UEM: 0.6445, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4299, partial_loss/deprel_loss: 0.4909, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6765, loss: 0.6043, batch_reg_loss: 0.1978, reg_loss: 0.1979 ||:  94%|#########3| 89/95 [00:59<00:04,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9588, LAS: 0.9221, UEM: 0.6399, LEM: 0.4076, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5266, partial_loss/deprel_loss: 0.4846, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6908, loss: 0.6058, batch_reg_loss: 0.1978, reg_loss: 0.1979 ||:  97%|#########6| 92/95 [01:03<00:02,  1.13it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9595, LAS: 0.9230, UEM: 0.6589, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1738, partial_loss/deprel_loss: 0.3277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4947, loss: 0.6001, batch_reg_loss: 0.1978, reg_loss: 0.1979 ||: 100%|##########| 95/95 [01:05<00:00,  1.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9595, LAS: 0.9230, UEM: 0.6589, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1738, partial_loss/deprel_loss: 0.3277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4947, loss: 0.6001, batch_reg_loss: 0.1978, reg_loss: 0.1979 ||: 100%|##########| 95/95 [01:05<00:00,  1.45it/s]\n",
+      "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.198  |       N/A\n",
+      "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - UEM                      |     0.659  |       N/A\n",
+      "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - LEM                      |     0.431  |       N/A\n",
+      "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - EM                       |     0.939  |       N/A\n",
+      "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.174  |       N/A\n",
+      "2023-04-07 01:26:29,688 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.328  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - loss                     |     0.600  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - LAS                      |     0.923  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:26:29,689 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:26:29,694 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:26:33,709 - INFO - combo.training.trainer - Epoch duration: 0:01:12.201244\n",
+      "2023-04-07 01:26:33,709 - INFO - combo.training.trainer - Estimated training time remaining: 5:01:18\n",
+      "2023-04-07 01:26:33,710 - INFO - allennlp.training.trainer - Epoch 137/399\n",
+      "2023-04-07 01:26:33,710 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:26:33,710 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:26:33,718 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9578, LAS: 0.9179, UEM: 0.6403, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8409, partial_loss/deprel_loss: 0.6153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8582, loss: 0.6337, batch_reg_loss: 0.1978, reg_loss: 0.1978 ||:   4%|4         | 4/95 [00:02<00:56,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9617, LAS: 0.9243, UEM: 0.6554, LEM: 0.3759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2772, partial_loss/deprel_loss: 0.3896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5648, loss: 0.5891, batch_reg_loss: 0.1977, reg_loss: 0.1978 ||:   8%|8         | 8/95 [00:04<00:54,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9616, LAS: 0.9247, UEM: 0.6517, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2115, partial_loss/deprel_loss: 0.3472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5177, loss: 0.5920, batch_reg_loss: 0.1977, reg_loss: 0.1977 ||:  13%|#2        | 12/95 [00:07<00:52,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9630, LAS: 0.9263, UEM: 0.6644, LEM: 0.4002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4985, partial_loss/deprel_loss: 0.5145, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7090, loss: 0.5823, batch_reg_loss: 0.1977, reg_loss: 0.1977 ||:  17%|#6        | 16/95 [00:09<00:47,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9618, LAS: 0.9251, UEM: 0.6491, LEM: 0.3903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2654, partial_loss/deprel_loss: 0.3221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5085, loss: 0.5885, batch_reg_loss: 0.1977, reg_loss: 0.1977 ||:  22%|##2       | 21/95 [00:11<00:40,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9616, LAS: 0.9249, UEM: 0.6594, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1471, partial_loss/deprel_loss: 0.2967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4644, loss: 0.5903, batch_reg_loss: 0.1977, reg_loss: 0.1977 ||:  27%|##7       | 26/95 [00:14<00:37,  1.86it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8684, UAS: 0.9591, LAS: 0.9221, UEM: 0.6384, LEM: 0.3941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2336, partial_loss/deprel_loss: 0.7373, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0342, loss: 0.6098, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||:  33%|###2      | 31/95 [00:17<00:34,  1.88it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9612, LAS: 0.9247, UEM: 0.6996, LEM: 0.4798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1872, partial_loss/deprel_loss: 0.3673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5289, loss: 0.5921, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||:  37%|###6      | 35/95 [00:20<00:37,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9609, LAS: 0.9246, UEM: 0.6880, LEM: 0.4679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4530, partial_loss/deprel_loss: 0.4076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6143, loss: 0.5916, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||:  41%|####1     | 39/95 [00:23<00:36,  1.53it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9601, LAS: 0.9238, UEM: 0.6744, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8377, partial_loss/deprel_loss: 0.5340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7924, loss: 0.5982, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||:  45%|####5     | 43/95 [00:25<00:32,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9594, LAS: 0.9230, UEM: 0.6606, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3537, partial_loss/deprel_loss: 0.4054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5927, loss: 0.6032, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||:  49%|####9     | 47/95 [00:28<00:30,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9600, LAS: 0.9236, UEM: 0.6667, LEM: 0.4433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3820, partial_loss/deprel_loss: 0.4031, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5965, loss: 0.5984, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||:  54%|#####3    | 51/95 [00:30<00:28,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9589, LAS: 0.9223, UEM: 0.6633, LEM: 0.4404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2752, partial_loss/deprel_loss: 0.3877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5628, loss: 0.6049, batch_reg_loss: 0.1976, reg_loss: 0.1977 ||:  58%|#####7    | 55/95 [00:33<00:25,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9590, LAS: 0.9223, UEM: 0.6597, LEM: 0.4351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3123, partial_loss/deprel_loss: 0.3900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5720, loss: 0.6049, batch_reg_loss: 0.1976, reg_loss: 0.1976 ||:  62%|######2   | 59/95 [00:35<00:23,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9592, LAS: 0.9223, UEM: 0.6543, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5126, partial_loss/deprel_loss: 0.4443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6555, loss: 0.6051, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||:  66%|######6   | 63/95 [00:38<00:21,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9601, LAS: 0.9233, UEM: 0.6704, LEM: 0.4427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1819, partial_loss/deprel_loss: 0.3038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.5972, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||:  71%|#######   | 67/95 [00:41<00:18,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9599, LAS: 0.9231, UEM: 0.6695, LEM: 0.4417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1581, partial_loss/deprel_loss: 0.2901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4612, loss: 0.5972, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||:  75%|#######4  | 71/95 [00:44<00:15,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9300, UAS: 0.9598, LAS: 0.9232, UEM: 0.6675, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2414, partial_loss/deprel_loss: 0.3645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5374, loss: 0.5974, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||:  79%|#######8  | 75/95 [00:46<00:13,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9603, LAS: 0.9235, UEM: 0.6675, LEM: 0.4369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5380, partial_loss/deprel_loss: 0.4932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6997, loss: 0.5962, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||:  83%|########3 | 79/95 [00:49<00:10,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9597, LAS: 0.9228, UEM: 0.6618, LEM: 0.4298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0778, partial_loss/deprel_loss: 0.6155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9054, loss: 0.6002, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||:  87%|########7 | 83/95 [00:52<00:08,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9596, LAS: 0.9226, UEM: 0.6607, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5729, partial_loss/deprel_loss: 0.5474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7499, loss: 0.6014, batch_reg_loss: 0.1975, reg_loss: 0.1976 ||:  91%|######### | 86/95 [00:54<00:06,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9594, LAS: 0.9224, UEM: 0.6574, LEM: 0.4264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6314, partial_loss/deprel_loss: 0.5472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7615, loss: 0.6034, batch_reg_loss: 0.1974, reg_loss: 0.1976 ||:  94%|#########3| 89/95 [00:56<00:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9598, LAS: 0.9227, UEM: 0.6653, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1512, partial_loss/deprel_loss: 0.3065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4729, loss: 0.6003, batch_reg_loss: 0.1974, reg_loss: 0.1976 ||:  97%|#########6| 92/95 [00:59<00:02,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9599, LAS: 0.9228, UEM: 0.6633, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3207, partial_loss/deprel_loss: 0.4402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6137, loss: 0.5997, batch_reg_loss: 0.1974, reg_loss: 0.1976 ||: 100%|##########| 95/95 [01:01<00:00,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9599, LAS: 0.9228, UEM: 0.6633, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3207, partial_loss/deprel_loss: 0.4402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6137, loss: 0.5997, batch_reg_loss: 0.1974, reg_loss: 0.1976 ||: 100%|##########| 95/95 [01:01<00:00,  1.55it/s]\n",
+      "2023-04-07 01:27:38,162 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:27:38,162 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:27:38,162 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.198  |       N/A\n",
+      "2023-04-07 01:27:38,162 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:27:38,162 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - UEM                      |     0.663  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - LEM                      |     0.432  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - EM                       |     0.928  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.321  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.440  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - loss                     |     0.600  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - LAS                      |     0.923  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:27:38,163 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:27:38,164 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:27:38,168 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:27:42,897 - INFO - combo.training.trainer - Epoch duration: 0:01:09.187591\n",
+      "2023-04-07 01:27:42,898 - INFO - combo.training.trainer - Estimated training time remaining: 5:00:10\n",
+      "2023-04-07 01:27:42,898 - INFO - allennlp.training.trainer - Epoch 138/399\n",
+      "2023-04-07 01:27:42,898 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:27:42,899 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:27:42,907 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9656, LAS: 0.9287, UEM: 0.6550, LEM: 0.3899, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2006, partial_loss/deprel_loss: 0.3173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4914, loss: 0.5460, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||:   3%|3         | 3/95 [00:02<01:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9685, LAS: 0.9327, UEM: 0.6778, LEM: 0.4097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2079, partial_loss/deprel_loss: 0.3084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4857, loss: 0.5286, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||:   6%|6         | 6/95 [00:04<01:03,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9696, UAS: 0.9720, LAS: 0.9371, UEM: 0.7967, LEM: 0.5964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0302, partial_loss/deprel_loss: 0.1199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2994, loss: 0.4928, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||:   8%|8         | 8/95 [00:06<01:10,  1.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9212, UAS: 0.9672, LAS: 0.9314, UEM: 0.7446, LEM: 0.5393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3475, partial_loss/deprel_loss: 0.4047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5906, loss: 0.5362, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||:  12%|#1        | 11/95 [00:08<01:05,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9339, UAS: 0.9653, LAS: 0.9291, UEM: 0.7202, LEM: 0.5100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1821, partial_loss/deprel_loss: 0.3007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4743, loss: 0.5506, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||:  15%|#4        | 14/95 [00:10<01:01,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9605, LAS: 0.9237, UEM: 0.6877, LEM: 0.4762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5680, partial_loss/deprel_loss: 0.4767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6923, loss: 0.5843, batch_reg_loss: 0.1974, reg_loss: 0.1974 ||:  18%|#7        | 17/95 [00:12<00:58,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9619, LAS: 0.9251, UEM: 0.6909, LEM: 0.4720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3146, partial_loss/deprel_loss: 0.3693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5557, loss: 0.5734, batch_reg_loss: 0.1973, reg_loss: 0.1974 ||:  21%|##1       | 20/95 [00:14<00:54,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9632, LAS: 0.9268, UEM: 0.7058, LEM: 0.4823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1060, partial_loss/deprel_loss: 0.2545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4221, loss: 0.5637, batch_reg_loss: 0.1973, reg_loss: 0.1974 ||:  24%|##4       | 23/95 [00:16<00:51,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9624, LAS: 0.9259, UEM: 0.6856, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7878, partial_loss/deprel_loss: 0.4806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7394, loss: 0.5732, batch_reg_loss: 0.1973, reg_loss: 0.1974 ||:  28%|##8       | 27/95 [00:19<00:45,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9623, LAS: 0.9256, UEM: 0.6836, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7151, partial_loss/deprel_loss: 0.5253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7605, loss: 0.5748, batch_reg_loss: 0.1973, reg_loss: 0.1974 ||:  33%|###2      | 31/95 [00:21<00:40,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9614, LAS: 0.9245, UEM: 0.6895, LEM: 0.4566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1021, partial_loss/deprel_loss: 0.2748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4375, loss: 0.5830, batch_reg_loss: 0.1973, reg_loss: 0.1974 ||:  37%|###6      | 35/95 [00:23<00:36,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9606, LAS: 0.9239, UEM: 0.6718, LEM: 0.4401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3850, partial_loss/deprel_loss: 0.4119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6038, loss: 0.5886, batch_reg_loss: 0.1973, reg_loss: 0.1973 ||:  41%|####1     | 39/95 [00:26<00:33,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9616, LAS: 0.9249, UEM: 0.6908, LEM: 0.4621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0725, partial_loss/deprel_loss: 0.1679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3460, loss: 0.5810, batch_reg_loss: 0.1973, reg_loss: 0.1973 ||:  45%|####5     | 43/95 [00:28<00:33,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9618, LAS: 0.9249, UEM: 0.7016, LEM: 0.4716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1319, partial_loss/deprel_loss: 0.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.5773, batch_reg_loss: 0.1973, reg_loss: 0.1973 ||:  49%|####9     | 47/95 [00:31<00:30,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9609, LAS: 0.9244, UEM: 0.6875, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3932, partial_loss/deprel_loss: 0.4072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6016, loss: 0.5833, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||:  54%|#####3    | 51/95 [00:33<00:27,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9611, LAS: 0.9247, UEM: 0.6906, LEM: 0.4601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1672, partial_loss/deprel_loss: 0.3010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4715, loss: 0.5804, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||:  58%|#####7    | 55/95 [00:35<00:23,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9598, LAS: 0.9234, UEM: 0.6782, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6884, partial_loss/deprel_loss: 0.4733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7135, loss: 0.5895, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||:  63%|######3   | 60/95 [00:38<00:19,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9594, LAS: 0.9229, UEM: 0.6681, LEM: 0.4365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2406, partial_loss/deprel_loss: 0.4217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5827, loss: 0.5960, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||:  68%|######8   | 65/95 [00:40<00:15,  1.93it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9601, LAS: 0.9236, UEM: 0.6772, LEM: 0.4460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2404, partial_loss/deprel_loss: 0.3519, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5268, loss: 0.5907, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||:  73%|#######2  | 69/95 [00:43<00:16,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9607, LAS: 0.9241, UEM: 0.6831, LEM: 0.4510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1677, partial_loss/deprel_loss: 0.2805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4551, loss: 0.5868, batch_reg_loss: 0.1972, reg_loss: 0.1973 ||:  77%|#######6  | 73/95 [00:46<00:14,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9604, LAS: 0.9236, UEM: 0.6764, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5734, partial_loss/deprel_loss: 0.4774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6938, loss: 0.5904, batch_reg_loss: 0.1971, reg_loss: 0.1973 ||:  81%|########1 | 77/95 [00:49<00:12,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9603, LAS: 0.9236, UEM: 0.6720, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5311, partial_loss/deprel_loss: 0.5182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7179, loss: 0.5907, batch_reg_loss: 0.1971, reg_loss: 0.1973 ||:  85%|########5 | 81/95 [00:52<00:09,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9596, LAS: 0.9229, UEM: 0.6633, LEM: 0.4306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4483, partial_loss/deprel_loss: 0.4611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6557, loss: 0.5969, batch_reg_loss: 0.1971, reg_loss: 0.1973 ||:  89%|########9 | 85/95 [00:55<00:06,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9308, UAS: 0.9596, LAS: 0.9229, UEM: 0.6591, LEM: 0.4251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2519, partial_loss/deprel_loss: 0.3435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5223, loss: 0.5968, batch_reg_loss: 0.1971, reg_loss: 0.1973 ||:  94%|#########3| 89/95 [00:57<00:04,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9599, LAS: 0.9233, UEM: 0.6637, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2108, partial_loss/deprel_loss: 0.2985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.5939, batch_reg_loss: 0.1971, reg_loss: 0.1973 ||:  97%|#########6| 92/95 [01:00<00:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9320, UAS: 0.9600, LAS: 0.9233, UEM: 0.6597, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2863, partial_loss/deprel_loss: 0.3374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5243, loss: 0.5936, batch_reg_loss: 0.1971, reg_loss: 0.1972 ||: 100%|##########| 95/95 [01:02<00:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9320, UAS: 0.9600, LAS: 0.9233, UEM: 0.6597, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2863, partial_loss/deprel_loss: 0.3374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5243, loss: 0.5936, batch_reg_loss: 0.1971, reg_loss: 0.1972 ||: 100%|##########| 95/95 [01:02<00:00,  1.53it/s]\n",
+      "2023-04-07 01:28:48,302 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:28:48,302 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:28:48,302 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.197  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - UEM                      |     0.660  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - LEM                      |     0.426  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - EM                       |     0.932  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.286  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.337  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - loss                     |     0.594  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - LAS                      |     0.923  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:28:48,303 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:28:48,304 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:28:48,304 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:28:48,304 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:28:48,308 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:28:53,247 - INFO - combo.training.trainer - Epoch duration: 0:01:10.348896\n",
+      "2023-04-07 01:28:53,248 - INFO - combo.training.trainer - Estimated training time remaining: 4:59:05\n",
+      "2023-04-07 01:28:53,248 - INFO - allennlp.training.trainer - Epoch 139/399\n",
+      "2023-04-07 01:28:53,248 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:28:53,249 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:28:53,260 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9606, LAS: 0.9218, UEM: 0.6580, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1156, partial_loss/deprel_loss: 0.2599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4281, loss: 0.5922, batch_reg_loss: 0.1971, reg_loss: 0.1971 ||:   4%|4         | 4/95 [00:02<01:00,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9517, LAS: 0.9137, UEM: 0.6397, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2519, partial_loss/deprel_loss: 0.2646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4591, loss: 0.6459, batch_reg_loss: 0.1971, reg_loss: 0.1971 ||:   7%|7         | 7/95 [00:04<01:01,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9240, UAS: 0.9535, LAS: 0.9163, UEM: 0.6238, LEM: 0.4033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3397, partial_loss/deprel_loss: 0.3835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5718, loss: 0.6356, batch_reg_loss: 0.1971, reg_loss: 0.1971 ||:  11%|#         | 10/95 [00:07<01:03,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9587, LAS: 0.9227, UEM: 0.6995, LEM: 0.4848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1266, partial_loss/deprel_loss: 0.2680, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4367, loss: 0.5918, batch_reg_loss: 0.1970, reg_loss: 0.1971 ||:  14%|#3        | 13/95 [00:10<01:02,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9244, UAS: 0.9599, LAS: 0.9239, UEM: 0.6762, LEM: 0.4573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3987, partial_loss/deprel_loss: 0.4457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6333, loss: 0.5941, batch_reg_loss: 0.1970, reg_loss: 0.1971 ||:  18%|#7        | 17/95 [00:12<00:55,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9584, LAS: 0.9223, UEM: 0.6474, LEM: 0.4253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8026, partial_loss/deprel_loss: 0.5058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7622, loss: 0.6050, batch_reg_loss: 0.1970, reg_loss: 0.1971 ||:  22%|##2       | 21/95 [00:14<00:50,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9586, LAS: 0.9222, UEM: 0.6493, LEM: 0.4246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2957, partial_loss/deprel_loss: 0.3742, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5555, loss: 0.6059, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||:  25%|##5       | 24/95 [00:17<00:50,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9588, LAS: 0.9221, UEM: 0.6425, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4044, partial_loss/deprel_loss: 0.3984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5966, loss: 0.6044, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||:  29%|##9       | 28/95 [00:19<00:45,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9609, LAS: 0.9247, UEM: 0.6930, LEM: 0.4803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2666, partial_loss/deprel_loss: 0.3292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5137, loss: 0.5868, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||:  33%|###2      | 31/95 [00:22<00:46,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9604, LAS: 0.9243, UEM: 0.6867, LEM: 0.4756, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6902, partial_loss/deprel_loss: 0.4548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6989, loss: 0.5879, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||:  36%|###5      | 34/95 [00:24<00:44,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9604, LAS: 0.9243, UEM: 0.6827, LEM: 0.4684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1529, partial_loss/deprel_loss: 0.2892, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4589, loss: 0.5894, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||:  40%|####      | 38/95 [00:27<00:41,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9598, LAS: 0.9235, UEM: 0.6741, LEM: 0.4571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3820, partial_loss/deprel_loss: 0.4045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5970, loss: 0.5943, batch_reg_loss: 0.1970, reg_loss: 0.1970 ||:  44%|####4     | 42/95 [00:29<00:36,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9596, LAS: 0.9232, UEM: 0.6796, LEM: 0.4645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1011, partial_loss/deprel_loss: 0.2468, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4146, loss: 0.5964, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||:  47%|####7     | 45/95 [00:32<00:36,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9592, LAS: 0.9226, UEM: 0.6667, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3255, partial_loss/deprel_loss: 0.4255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6024, loss: 0.6007, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||:  52%|#####1    | 49/95 [00:34<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9585, LAS: 0.9219, UEM: 0.6564, LEM: 0.4384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4568, partial_loss/deprel_loss: 0.5608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7370, loss: 0.6071, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||:  55%|#####4    | 52/95 [00:36<00:30,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9590, LAS: 0.9223, UEM: 0.6594, LEM: 0.4388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1864, partial_loss/deprel_loss: 0.3183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4888, loss: 0.6044, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||:  58%|#####7    | 55/95 [00:38<00:28,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9227, UEM: 0.6548, LEM: 0.4319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4273, partial_loss/deprel_loss: 0.3596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5701, loss: 0.6018, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||:  62%|######2   | 59/95 [00:41<00:24,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9588, LAS: 0.9220, UEM: 0.6436, LEM: 0.4207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7359, partial_loss/deprel_loss: 0.5160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7569, loss: 0.6058, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||:  66%|######6   | 63/95 [00:43<00:21,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9595, LAS: 0.9227, UEM: 0.6474, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5647, partial_loss/deprel_loss: 0.4988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7089, loss: 0.6011, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||:  72%|#######1  | 68/95 [00:46<00:16,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9599, LAS: 0.9232, UEM: 0.6477, LEM: 0.4197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3547, partial_loss/deprel_loss: 0.3603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5561, loss: 0.5981, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||:  77%|#######6  | 73/95 [00:48<00:12,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9224, UAS: 0.9603, LAS: 0.9237, UEM: 0.6488, LEM: 0.4201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2814, partial_loss/deprel_loss: 0.4058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5778, loss: 0.5955, batch_reg_loss: 0.1969, reg_loss: 0.1970 ||:  82%|########2 | 78/95 [00:50<00:08,  1.91it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9602, LAS: 0.9235, UEM: 0.6453, LEM: 0.4163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6260, partial_loss/deprel_loss: 0.5170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7357, loss: 0.5959, batch_reg_loss: 0.1968, reg_loss: 0.1970 ||:  86%|########6 | 82/95 [00:52<00:06,  1.93it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9557, UAS: 0.9609, LAS: 0.9244, UEM: 0.6631, LEM: 0.4377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0888, partial_loss/deprel_loss: 0.1850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3626, loss: 0.5888, batch_reg_loss: 0.1968, reg_loss: 0.1970 ||:  91%|######### | 86/95 [00:55<00:05,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9311, UAS: 0.9613, LAS: 0.9247, UEM: 0.6672, LEM: 0.4403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3059, partial_loss/deprel_loss: 0.3469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5356, loss: 0.5864, batch_reg_loss: 0.1968, reg_loss: 0.1970 ||:  95%|#########4| 90/95 [00:58<00:02,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9607, LAS: 0.9241, UEM: 0.6642, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2155, partial_loss/deprel_loss: 0.2877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4700, loss: 0.5906, batch_reg_loss: 0.1968, reg_loss: 0.1969 ||:  99%|#########8| 94/95 [01:01<00:00,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9608, LAS: 0.9244, UEM: 0.6660, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1725, partial_loss/deprel_loss: 0.2655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.5890, batch_reg_loss: 0.1968, reg_loss: 0.1969 ||: 100%|##########| 95/95 [01:02<00:00,  1.53it/s]\n",
+      "2023-04-07 01:29:58,402 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.197  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - UEM                      |     0.666  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - LEM                      |     0.440  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - EM                       |     0.947  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.172  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.266  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - loss                     |     0.589  |       N/A\n",
+      "2023-04-07 01:29:58,403 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |       N/A\n",
+      "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:29:58,404 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:29:58,408 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:30:02,573 - INFO - combo.training.trainer - Epoch duration: 0:01:09.325241\n",
+      "2023-04-07 01:30:02,574 - INFO - combo.training.trainer - Estimated training time remaining: 4:57:57\n",
+      "2023-04-07 01:30:02,574 - INFO - allennlp.training.trainer - Epoch 140/399\n",
+      "2023-04-07 01:30:02,574 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:30:02,575 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:30:02,584 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9549, LAS: 0.9209, UEM: 0.4025, LEM: 0.1541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5523, partial_loss/deprel_loss: 0.4377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6574, loss: 0.6231, batch_reg_loss: 0.1968, reg_loss: 0.1968 ||:   3%|3         | 3/95 [00:02<01:03,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9597, LAS: 0.9261, UEM: 0.5462, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2514, partial_loss/deprel_loss: 0.3139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4982, loss: 0.5811, batch_reg_loss: 0.1968, reg_loss: 0.1968 ||:   6%|6         | 6/95 [00:04<01:05,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9625, LAS: 0.9282, UEM: 0.6070, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3815, partial_loss/deprel_loss: 0.4141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6043, loss: 0.5652, batch_reg_loss: 0.1968, reg_loss: 0.1968 ||:   9%|9         | 9/95 [00:06<01:02,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9641, LAS: 0.9287, UEM: 0.6138, LEM: 0.3559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3036, partial_loss/deprel_loss: 0.3618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5469, loss: 0.5624, batch_reg_loss: 0.1967, reg_loss: 0.1968 ||:  14%|#3        | 13/95 [00:09<00:58,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9634, LAS: 0.9279, UEM: 0.5874, LEM: 0.3375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3066, partial_loss/deprel_loss: 0.3654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5504, loss: 0.5709, batch_reg_loss: 0.1967, reg_loss: 0.1968 ||:  18%|#7        | 17/95 [00:11<00:53,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9626, LAS: 0.9273, UEM: 0.6171, LEM: 0.3748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1938, partial_loss/deprel_loss: 0.3088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4825, loss: 0.5762, batch_reg_loss: 0.1967, reg_loss: 0.1967 ||:  22%|##2       | 21/95 [00:14<00:50,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9621, LAS: 0.9271, UEM: 0.6139, LEM: 0.3754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5532, partial_loss/deprel_loss: 0.4882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6979, loss: 0.5798, batch_reg_loss: 0.1967, reg_loss: 0.1967 ||:  26%|##6       | 25/95 [00:16<00:45,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9642, LAS: 0.9293, UEM: 0.6653, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1061, partial_loss/deprel_loss: 0.2268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3993, loss: 0.5612, batch_reg_loss: 0.1967, reg_loss: 0.1967 ||:  31%|###       | 29/95 [00:19<00:43,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9648, LAS: 0.9300, UEM: 0.6708, LEM: 0.4334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1593, partial_loss/deprel_loss: 0.2767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.5571, batch_reg_loss: 0.1967, reg_loss: 0.1967 ||:  34%|###3      | 32/95 [00:21<00:42,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9654, LAS: 0.9306, UEM: 0.6747, LEM: 0.4355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3367, partial_loss/deprel_loss: 0.3737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5629, loss: 0.5531, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||:  37%|###6      | 35/95 [00:23<00:40,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9509, UAS: 0.9647, LAS: 0.9300, UEM: 0.6875, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0927, partial_loss/deprel_loss: 0.1957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3717, loss: 0.5578, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||:  40%|####      | 38/95 [00:25<00:38,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9653, LAS: 0.9305, UEM: 0.6997, LEM: 0.4698, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1231, partial_loss/deprel_loss: 0.2722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4390, loss: 0.5533, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||:  43%|####3     | 41/95 [00:28<00:38,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9630, LAS: 0.9282, UEM: 0.6846, LEM: 0.4581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4382, partial_loss/deprel_loss: 0.3811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5891, loss: 0.5681, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||:  46%|####6     | 44/95 [00:30<00:36,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9621, LAS: 0.9270, UEM: 0.6746, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1712, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4848, loss: 0.5769, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||:  51%|#####     | 48/95 [00:33<00:33,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9622, LAS: 0.9273, UEM: 0.6796, LEM: 0.4551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4518, partial_loss/deprel_loss: 0.4611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6558, loss: 0.5744, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||:  54%|#####3    | 51/95 [00:35<00:32,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9606, LAS: 0.9253, UEM: 0.6697, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1981, partial_loss/deprel_loss: 0.3362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5051, loss: 0.5853, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||:  58%|#####7    | 55/95 [00:38<00:28,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9613, LAS: 0.9259, UEM: 0.6830, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1258, partial_loss/deprel_loss: 0.2682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4363, loss: 0.5806, batch_reg_loss: 0.1966, reg_loss: 0.1967 ||:  61%|######1   | 58/95 [00:41<00:29,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9614, LAS: 0.9258, UEM: 0.6792, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3390, partial_loss/deprel_loss: 0.3466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5416, loss: 0.5810, batch_reg_loss: 0.1965, reg_loss: 0.1967 ||:  65%|######5   | 62/95 [00:43<00:23,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9311, UAS: 0.9615, LAS: 0.9259, UEM: 0.6776, LEM: 0.4493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2763, partial_loss/deprel_loss: 0.3455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5282, loss: 0.5802, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||:  69%|######9   | 66/95 [00:45<00:20,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9615, LAS: 0.9259, UEM: 0.6753, LEM: 0.4469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6507, partial_loss/deprel_loss: 0.5641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7780, loss: 0.5807, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||:  73%|#######2  | 69/95 [00:48<00:18,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9606, LAS: 0.9247, UEM: 0.6655, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3926, partial_loss/deprel_loss: 0.4924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6689, loss: 0.5882, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||:  77%|#######6  | 73/95 [00:50<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9603, LAS: 0.9245, UEM: 0.6605, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5515, loss: 0.5893, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||:  80%|########  | 76/95 [00:52<00:13,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9606, LAS: 0.9246, UEM: 0.6631, LEM: 0.4338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3329, partial_loss/deprel_loss: 0.3601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5512, loss: 0.5882, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||:  83%|########3 | 79/95 [00:54<00:11,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9603, LAS: 0.9243, UEM: 0.6587, LEM: 0.4296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5302, partial_loss/deprel_loss: 0.4732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6811, loss: 0.5910, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||:  87%|########7 | 83/95 [00:57<00:08,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9356, UAS: 0.9602, LAS: 0.9242, UEM: 0.6559, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2396, partial_loss/deprel_loss: 0.3221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5021, loss: 0.5927, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||:  93%|#########2| 88/95 [00:59<00:04,  1.62it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9603, LAS: 0.9242, UEM: 0.6540, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2837, partial_loss/deprel_loss: 0.3571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5389, loss: 0.5917, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||:  98%|#########7| 93/95 [01:02<00:01,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9603, LAS: 0.9243, UEM: 0.6653, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8845, partial_loss/deprel_loss: 0.5812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8383, loss: 0.5912, batch_reg_loss: 0.1965, reg_loss: 0.1966 ||: 100%|##########| 95/95 [01:03<00:00,  1.50it/s]\n",
+      "2023-04-07 01:31:09,161 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9528, LAS: 0.9029, UEM: 0.8072, LEM: 0.6049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0580, partial_loss/deprel_loss: 15.0226, partial_loss/cycle_loss: 0.0000, batch_loss: 12.2297, loss: 8.1817, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:09,  1.05s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9521, LAS: 0.9017, UEM: 0.7197, LEM: 0.4644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3701, partial_loss/deprel_loss: 7.7624, partial_loss/cycle_loss: 0.0000, batch_loss: 6.2839, loss: 8.5380, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:06,  1.02s/it]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9540, LAS: 0.9034, UEM: 0.7199, LEM: 0.4410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2049, partial_loss/deprel_loss: 5.8722, partial_loss/cycle_loss: 0.0000, batch_loss: 4.7387, loss: 7.7018, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:07<00:03,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9512, LAS: 0.9000, UEM: 0.6878, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9186, partial_loss/deprel_loss: 10.7496, partial_loss/cycle_loss: 0.0000, batch_loss: 8.7834, loss: 8.3488, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.02s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9512, LAS: 0.9000, UEM: 0.6878, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9186, partial_loss/deprel_loss: 10.7496, partial_loss/cycle_loss: 0.0000, batch_loss: 8.7834, loss: 8.3488, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.00it/s]\n",
+      "2023-04-07 01:31:20,174 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.197  |     0.000\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - UEM                      |     0.665  |     0.688\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - LEM                      |     0.439  |     0.410\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - EM                       |     0.888  |     0.892\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.884  |     0.919\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |     0.951\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.581  |    10.750\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - loss                     |     0.591  |     8.349\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |     0.900\n",
+      "2023-04-07 01:31:20,175 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:31:20,176 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:31:20,176 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:31:20,176 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:31:20,176 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:31:20,176 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:31:20,180 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:31:24,963 - INFO - combo.training.trainer - Epoch duration: 0:01:22.388611\n",
+      "2023-04-07 01:31:24,963 - INFO - combo.training.trainer - Estimated training time remaining: 4:57:13\n",
+      "2023-04-07 01:31:24,963 - INFO - allennlp.training.trainer - Epoch 141/399\n",
+      "2023-04-07 01:31:24,963 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:31:24,964 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:31:24,973 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9714, LAS: 0.9367, UEM: 0.7460, LEM: 0.4968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2083, partial_loss/deprel_loss: 0.3262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4991, loss: 0.5037, batch_reg_loss: 0.1965, reg_loss: 0.1965 ||:   3%|3         | 3/95 [00:02<01:12,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9701, LAS: 0.9349, UEM: 0.7408, LEM: 0.4896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2253, partial_loss/deprel_loss: 0.3309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5062, loss: 0.5114, batch_reg_loss: 0.1965, reg_loss: 0.1965 ||:   6%|6         | 6/95 [00:04<01:12,  1.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9699, LAS: 0.9346, UEM: 0.7492, LEM: 0.5091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4965, partial_loss/deprel_loss: 0.4303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6400, loss: 0.5193, batch_reg_loss: 0.1964, reg_loss: 0.1965 ||:   9%|9         | 9/95 [00:07<01:10,  1.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9700, LAS: 0.9353, UEM: 0.7390, LEM: 0.4933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1402, partial_loss/deprel_loss: 0.2776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4466, loss: 0.5176, batch_reg_loss: 0.1964, reg_loss: 0.1965 ||:  14%|#3        | 13/95 [00:10<01:03,  1.29it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9383, UAS: 0.9668, LAS: 0.9321, UEM: 0.6963, LEM: 0.4561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2890, partial_loss/deprel_loss: 0.3554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5385, loss: 0.5396, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||:  18%|#7        | 17/95 [00:12<00:57,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9660, LAS: 0.9314, UEM: 0.6880, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1620, partial_loss/deprel_loss: 0.2415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4220, loss: 0.5408, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||:  21%|##1       | 20/95 [00:14<00:54,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9640, LAS: 0.9295, UEM: 0.6576, LEM: 0.4233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4328, partial_loss/deprel_loss: 0.4518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6444, loss: 0.5569, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||:  25%|##5       | 24/95 [00:17<00:49,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9644, LAS: 0.9299, UEM: 0.6597, LEM: 0.4243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3868, partial_loss/deprel_loss: 0.3504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5541, loss: 0.5500, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||:  28%|##8       | 27/95 [00:19<00:47,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9650, LAS: 0.9310, UEM: 0.6749, LEM: 0.4440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5194, partial_loss/deprel_loss: 0.4562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6652, loss: 0.5463, batch_reg_loss: 0.1964, reg_loss: 0.1964 ||:  33%|###2      | 31/95 [00:21<00:43,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9653, LAS: 0.9308, UEM: 0.6795, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1588, partial_loss/deprel_loss: 0.3028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4704, loss: 0.5468, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||:  37%|###6      | 35/95 [00:24<00:41,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9639, LAS: 0.9294, UEM: 0.6681, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6353, partial_loss/deprel_loss: 0.4657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6959, loss: 0.5570, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||:  40%|####      | 38/95 [00:27<00:40,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9635, LAS: 0.9291, UEM: 0.6576, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4292, partial_loss/deprel_loss: 0.4423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6360, loss: 0.5602, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||:  43%|####3     | 41/95 [00:29<00:39,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9636, LAS: 0.9291, UEM: 0.6645, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5756, partial_loss/deprel_loss: 0.4647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6832, loss: 0.5583, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||:  47%|####7     | 45/95 [00:32<00:35,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9643, LAS: 0.9298, UEM: 0.6827, LEM: 0.4551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4058, partial_loss/deprel_loss: 0.3831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5840, loss: 0.5532, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||:  51%|#####     | 48/95 [00:34<00:33,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9627, LAS: 0.9279, UEM: 0.6729, LEM: 0.4464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6470, partial_loss/deprel_loss: 0.5355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7541, loss: 0.5667, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||:  55%|#####4    | 52/95 [00:36<00:30,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9612, LAS: 0.9263, UEM: 0.6632, LEM: 0.4375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3347, partial_loss/deprel_loss: 0.3655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5556, loss: 0.5758, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||:  58%|#####7    | 55/95 [00:39<00:28,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9617, LAS: 0.9264, UEM: 0.6674, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5713, partial_loss/deprel_loss: 0.5004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7109, loss: 0.5742, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||:  62%|######2   | 59/95 [00:41<00:25,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9613, LAS: 0.9259, UEM: 0.6627, LEM: 0.4299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7711, partial_loss/deprel_loss: 0.4545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7141, loss: 0.5765, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||:  65%|######5   | 62/95 [00:43<00:22,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9620, LAS: 0.9269, UEM: 0.6826, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.3224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5014, loss: 0.5707, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||:  68%|######8   | 65/95 [00:46<00:22,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9619, LAS: 0.9268, UEM: 0.6770, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3012, partial_loss/deprel_loss: 0.3422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5302, loss: 0.5722, batch_reg_loss: 0.1963, reg_loss: 0.1964 ||:  72%|#######1  | 68/95 [00:48<00:19,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9623, LAS: 0.9269, UEM: 0.6827, LEM: 0.4593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4133, partial_loss/deprel_loss: 0.4139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6101, loss: 0.5706, batch_reg_loss: 0.1962, reg_loss: 0.1964 ||:  75%|#######4  | 71/95 [00:50<00:17,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9613, LAS: 0.9259, UEM: 0.6748, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8964, partial_loss/deprel_loss: 0.5235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7943, loss: 0.5785, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||:  78%|#######7  | 74/95 [00:53<00:15,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9617, LAS: 0.9263, UEM: 0.6787, LEM: 0.4550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1303, partial_loss/deprel_loss: 0.2875, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4523, loss: 0.5757, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||:  81%|########1 | 77/95 [00:55<00:13,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9610, LAS: 0.9255, UEM: 0.6708, LEM: 0.4476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5844, partial_loss/deprel_loss: 0.5272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7348, loss: 0.5810, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||:  85%|########5 | 81/95 [00:57<00:09,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9613, LAS: 0.9257, UEM: 0.6749, LEM: 0.4501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 0.2624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4345, loss: 0.5795, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||:  89%|########9 | 85/95 [00:59<00:06,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9608, LAS: 0.9253, UEM: 0.6695, LEM: 0.4445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2800, partial_loss/deprel_loss: 0.4059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5769, loss: 0.5848, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||:  95%|#########4| 90/95 [01:01<00:02,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9602, LAS: 0.9246, UEM: 0.6635, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2889, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.5889, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||: 100%|##########| 95/95 [01:04<00:00,  1.84it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9602, LAS: 0.9246, UEM: 0.6635, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2889, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.5889, batch_reg_loss: 0.1962, reg_loss: 0.1963 ||: 100%|##########| 95/95 [01:04<00:00,  1.48it/s]\n",
+      "2023-04-07 01:32:32,427 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:32:32,427 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:32:32,427 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.196  |       N/A\n",
+      "2023-04-07 01:32:32,427 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:32:32,427 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - UEM                      |     0.663  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - LEM                      |     0.438  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - EM                       |     0.919  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.289  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.446  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - loss                     |     0.589  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - LAS                      |     0.925  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:32:32,428 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:32:32,429 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:32:32,433 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:32:37,205 - INFO - combo.training.trainer - Epoch duration: 0:01:12.242078\n",
+      "2023-04-07 01:32:37,206 - INFO - combo.training.trainer - Estimated training time remaining: 4:56:11\n",
+      "2023-04-07 01:32:37,206 - INFO - allennlp.training.trainer - Epoch 142/399\n",
+      "2023-04-07 01:32:37,206 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:32:37,207 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:32:37,216 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9688, UAS: 0.9777, LAS: 0.9494, UEM: 0.8833, LEM: 0.7480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0388, partial_loss/deprel_loss: 0.1253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3042, loss: 0.4407, batch_reg_loss: 0.1962, reg_loss: 0.1962 ||:   3%|3         | 3/95 [00:02<01:22,  1.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9649, LAS: 0.9341, UEM: 0.7764, LEM: 0.6172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7783, partial_loss/deprel_loss: 0.5240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7710, loss: 0.5270, batch_reg_loss: 0.1962, reg_loss: 0.1962 ||:   7%|7         | 7/95 [00:05<01:11,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9649, LAS: 0.9322, UEM: 0.7507, LEM: 0.5661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5494, partial_loss/deprel_loss: 0.4676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6801, loss: 0.5340, batch_reg_loss: 0.1962, reg_loss: 0.1962 ||:  11%|#         | 10/95 [00:07<01:06,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9620, LAS: 0.9283, UEM: 0.6980, LEM: 0.5131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4609, partial_loss/deprel_loss: 0.4467, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6457, loss: 0.5675, batch_reg_loss: 0.1962, reg_loss: 0.1962 ||:  14%|#3        | 13/95 [00:09<01:04,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8763, UAS: 0.9587, LAS: 0.9246, UEM: 0.6785, LEM: 0.4945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0301, partial_loss/deprel_loss: 0.6155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8946, loss: 0.5862, batch_reg_loss: 0.1962, reg_loss: 0.1962 ||:  17%|#6        | 16/95 [00:12<01:02,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9356, UAS: 0.9591, LAS: 0.9244, UEM: 0.6665, LEM: 0.4709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2481, partial_loss/deprel_loss: 0.3529, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5281, loss: 0.5871, batch_reg_loss: 0.1961, reg_loss: 0.1962 ||:  20%|##        | 19/95 [00:14<00:59,  1.28it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9596, LAS: 0.9249, UEM: 0.6609, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6963, partial_loss/deprel_loss: 0.5092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7427, loss: 0.5863, batch_reg_loss: 0.1961, reg_loss: 0.1962 ||:  23%|##3       | 22/95 [00:16<00:55,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9600, LAS: 0.9255, UEM: 0.6505, LEM: 0.4409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3017, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5659, loss: 0.5816, batch_reg_loss: 0.1961, reg_loss: 0.1962 ||:  27%|##7       | 26/95 [00:19<00:50,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9594, LAS: 0.9246, UEM: 0.6400, LEM: 0.4298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1459, partial_loss/deprel_loss: 0.2655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4377, loss: 0.5892, batch_reg_loss: 0.1961, reg_loss: 0.1962 ||:  32%|###1      | 30/95 [00:21<00:45,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9601, LAS: 0.9252, UEM: 0.6502, LEM: 0.4362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1923, partial_loss/deprel_loss: 0.3372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5043, loss: 0.5835, batch_reg_loss: 0.1961, reg_loss: 0.1961 ||:  36%|###5      | 34/95 [00:24<00:42,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9610, LAS: 0.9259, UEM: 0.6487, LEM: 0.4274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2934, partial_loss/deprel_loss: 0.3326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5209, loss: 0.5772, batch_reg_loss: 0.1961, reg_loss: 0.1961 ||:  40%|####      | 38/95 [00:27<00:39,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9602, LAS: 0.9251, UEM: 0.6432, LEM: 0.4243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6596, partial_loss/deprel_loss: 0.5420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7616, loss: 0.5861, batch_reg_loss: 0.1961, reg_loss: 0.1961 ||:  44%|####4     | 42/95 [00:29<00:36,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9589, LAS: 0.9238, UEM: 0.6306, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3692, partial_loss/deprel_loss: 0.3943, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5854, loss: 0.5962, batch_reg_loss: 0.1961, reg_loss: 0.1961 ||:  48%|####8     | 46/95 [00:32<00:33,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9595, LAS: 0.9244, UEM: 0.6349, LEM: 0.4136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4241, partial_loss/deprel_loss: 0.3944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5964, loss: 0.5920, batch_reg_loss: 0.1961, reg_loss: 0.1961 ||:  52%|#####1    | 49/95 [00:34<00:31,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9596, LAS: 0.9245, UEM: 0.6418, LEM: 0.4209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1112, partial_loss/deprel_loss: 0.2305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4027, loss: 0.5904, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||:  55%|#####4    | 52/95 [00:36<00:30,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9600, LAS: 0.9247, UEM: 0.6388, LEM: 0.4148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3810, partial_loss/deprel_loss: 0.3844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.5873, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||:  59%|#####8    | 56/95 [00:39<00:26,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9599, LAS: 0.9246, UEM: 0.6323, LEM: 0.4078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2395, partial_loss/deprel_loss: 0.3450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5199, loss: 0.5898, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||:  63%|######3   | 60/95 [00:41<00:23,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9607, LAS: 0.9254, UEM: 0.6508, LEM: 0.4267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1561, partial_loss/deprel_loss: 0.2461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4241, loss: 0.5838, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||:  67%|######7   | 64/95 [00:45<00:22,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9607, LAS: 0.9255, UEM: 0.6534, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2530, partial_loss/deprel_loss: 0.3697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5424, loss: 0.5826, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||:  71%|#######   | 67/95 [00:47<00:21,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9614, LAS: 0.9263, UEM: 0.6692, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.3004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4793, loss: 0.5763, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||:  74%|#######3  | 70/95 [00:50<00:19,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9607, LAS: 0.9256, UEM: 0.6611, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4577, partial_loss/deprel_loss: 0.4822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6733, loss: 0.5809, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||:  77%|#######6  | 73/95 [00:52<00:16,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8988, UAS: 0.9603, LAS: 0.9251, UEM: 0.6563, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6469, partial_loss/deprel_loss: 0.5195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7410, loss: 0.5840, batch_reg_loss: 0.1960, reg_loss: 0.1961 ||:  80%|########  | 76/95 [00:54<00:14,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9364, UAS: 0.9606, LAS: 0.9252, UEM: 0.6554, LEM: 0.4333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2148, partial_loss/deprel_loss: 0.3316, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5042, loss: 0.5840, batch_reg_loss: 0.1959, reg_loss: 0.1961 ||:  84%|########4 | 80/95 [00:57<00:10,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9608, LAS: 0.9254, UEM: 0.6583, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2209, partial_loss/deprel_loss: 0.3497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5198, loss: 0.5823, batch_reg_loss: 0.1959, reg_loss: 0.1961 ||:  88%|########8 | 84/95 [00:59<00:07,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9605, LAS: 0.9248, UEM: 0.6545, LEM: 0.4318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3878, partial_loss/deprel_loss: 0.4341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6208, loss: 0.5860, batch_reg_loss: 0.1959, reg_loss: 0.1961 ||:  93%|#########2| 88/95 [01:02<00:04,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9549, UAS: 0.9608, LAS: 0.9254, UEM: 0.6593, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0785, partial_loss/deprel_loss: 0.2125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3816, loss: 0.5826, batch_reg_loss: 0.1959, reg_loss: 0.1961 ||:  97%|#########6| 92/95 [01:05<00:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9607, LAS: 0.9253, UEM: 0.6619, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3045, partial_loss/deprel_loss: 0.3832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5634, loss: 0.5830, batch_reg_loss: 0.1959, reg_loss: 0.1961 ||: 100%|##########| 95/95 [01:07<00:00,  1.42it/s]\n",
+      "2023-04-07 01:33:47,060 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:33:47,060 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:33:47,060 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.196  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - UEM                      |     0.662  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - LEM                      |     0.441  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - EM                       |     0.932  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.305  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.383  |       N/A\n",
+      "2023-04-07 01:33:47,061 - INFO - combo.training.tensorboard_writer - loss                     |     0.583  |       N/A\n",
+      "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - LAS                      |     0.925  |       N/A\n",
+      "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:33:47,062 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:33:47,068 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:33:55,192 - INFO - combo.training.trainer - Epoch duration: 0:01:17.985545\n",
+      "2023-04-07 01:33:55,192 - INFO - combo.training.trainer - Estimated training time remaining: 4:55:18\n",
+      "2023-04-07 01:33:55,192 - INFO - allennlp.training.trainer - Epoch 143/399\n",
+      "2023-04-07 01:33:55,193 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:33:55,193 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:33:55,204 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9612, LAS: 0.9258, UEM: 0.6181, LEM: 0.3611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1987, partial_loss/deprel_loss: 0.3033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4783, loss: 0.5987, batch_reg_loss: 0.1959, reg_loss: 0.1959 ||:   3%|3         | 3/95 [00:02<01:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9610, LAS: 0.9261, UEM: 0.6852, LEM: 0.4737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1229, partial_loss/deprel_loss: 0.2424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4144, loss: 0.5864, batch_reg_loss: 0.1959, reg_loss: 0.1959 ||:   6%|6         | 6/95 [00:04<01:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9638, LAS: 0.9298, UEM: 0.7018, LEM: 0.4829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4217, partial_loss/deprel_loss: 0.3645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5718, loss: 0.5592, batch_reg_loss: 0.1959, reg_loss: 0.1959 ||:   9%|9         | 9/95 [00:06<01:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9642, LAS: 0.9291, UEM: 0.6939, LEM: 0.4609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3576, partial_loss/deprel_loss: 0.4495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6270, loss: 0.5620, batch_reg_loss: 0.1959, reg_loss: 0.1959 ||:  14%|#3        | 13/95 [00:08<00:55,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9656, LAS: 0.9312, UEM: 0.6985, LEM: 0.4561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2052, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5034, loss: 0.5495, batch_reg_loss: 0.1959, reg_loss: 0.1959 ||:  17%|#6        | 16/95 [00:10<00:53,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9652, LAS: 0.9304, UEM: 0.6762, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3206, partial_loss/deprel_loss: 0.4123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5898, loss: 0.5570, batch_reg_loss: 0.1958, reg_loss: 0.1959 ||:  21%|##1       | 20/95 [00:13<00:49,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9641, LAS: 0.9292, UEM: 0.6711, LEM: 0.4237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8708, partial_loss/deprel_loss: 0.5786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8329, loss: 0.5636, batch_reg_loss: 0.1958, reg_loss: 0.1959 ||:  25%|##5       | 24/95 [00:15<00:46,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9606, LAS: 0.9258, UEM: 0.6350, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7316, partial_loss/deprel_loss: 0.4971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7398, loss: 0.5861, batch_reg_loss: 0.1958, reg_loss: 0.1959 ||:  29%|##9       | 28/95 [00:18<00:42,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9622, LAS: 0.9276, UEM: 0.6612, LEM: 0.4260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1479, partial_loss/deprel_loss: 0.3394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4969, loss: 0.5753, batch_reg_loss: 0.1958, reg_loss: 0.1959 ||:  33%|###2      | 31/95 [00:20<00:42,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9620, LAS: 0.9273, UEM: 0.6577, LEM: 0.4220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5023, partial_loss/deprel_loss: 0.4073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.5765, batch_reg_loss: 0.1958, reg_loss: 0.1958 ||:  37%|###6      | 35/95 [00:23<00:39,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9617, LAS: 0.9270, UEM: 0.6629, LEM: 0.4267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.3001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4697, loss: 0.5802, batch_reg_loss: 0.1958, reg_loss: 0.1958 ||:  41%|####1     | 39/95 [00:25<00:38,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9618, LAS: 0.9267, UEM: 0.6589, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1680, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4603, loss: 0.5808, batch_reg_loss: 0.1958, reg_loss: 0.1958 ||:  45%|####5     | 43/95 [00:28<00:34,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8751, UAS: 0.9605, LAS: 0.9251, UEM: 0.6532, LEM: 0.4173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1675, partial_loss/deprel_loss: 0.5706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8857, loss: 0.5888, batch_reg_loss: 0.1958, reg_loss: 0.1958 ||:  49%|####9     | 47/95 [00:31<00:32,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9607, LAS: 0.9252, UEM: 0.6515, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.3638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5322, loss: 0.5878, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||:  53%|#####2    | 50/95 [00:33<00:31,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9607, LAS: 0.9253, UEM: 0.6461, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3210, partial_loss/deprel_loss: 0.4266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.5878, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||:  56%|#####5    | 53/95 [00:35<00:29,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9604, LAS: 0.9249, UEM: 0.6493, LEM: 0.4142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6948, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7829, loss: 0.5891, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||:  60%|######    | 57/95 [00:38<00:25,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9609, LAS: 0.9253, UEM: 0.6618, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2951, partial_loss/deprel_loss: 0.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5244, loss: 0.5847, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||:  63%|######3   | 60/95 [00:40<00:24,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9613, LAS: 0.9257, UEM: 0.6606, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1720, partial_loss/deprel_loss: 0.2721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4478, loss: 0.5817, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||:  67%|######7   | 64/95 [00:42<00:21,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9612, LAS: 0.9256, UEM: 0.6601, LEM: 0.4277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1927, partial_loss/deprel_loss: 0.2857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4628, loss: 0.5822, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||:  71%|#######   | 67/95 [00:45<00:19,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9606, LAS: 0.9249, UEM: 0.6512, LEM: 0.4198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4352, partial_loss/deprel_loss: 0.4888, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6738, loss: 0.5877, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||:  74%|#######3  | 70/95 [00:47<00:18,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9605, LAS: 0.9247, UEM: 0.6530, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0181, partial_loss/deprel_loss: 0.5776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8614, loss: 0.5887, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||:  77%|#######6  | 73/95 [00:49<00:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9605, LAS: 0.9248, UEM: 0.6503, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4662, partial_loss/deprel_loss: 0.4649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6608, loss: 0.5886, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||:  80%|########  | 76/95 [00:51<00:13,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9610, LAS: 0.9253, UEM: 0.6573, LEM: 0.4243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2688, partial_loss/deprel_loss: 0.3295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5130, loss: 0.5846, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||:  83%|########3 | 79/95 [00:54<00:11,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9608, LAS: 0.9250, UEM: 0.6565, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6618, partial_loss/deprel_loss: 0.5038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7311, loss: 0.5867, batch_reg_loss: 0.1957, reg_loss: 0.1958 ||:  86%|########6 | 82/95 [00:56<00:09,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9610, LAS: 0.9251, UEM: 0.6557, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2986, partial_loss/deprel_loss: 0.3646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5471, loss: 0.5860, batch_reg_loss: 0.1956, reg_loss: 0.1958 ||:  89%|########9 | 85/95 [00:58<00:07,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9736, UAS: 0.9613, LAS: 0.9255, UEM: 0.6675, LEM: 0.4407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0363, partial_loss/deprel_loss: 0.0917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2763, loss: 0.5831, batch_reg_loss: 0.1956, reg_loss: 0.1958 ||:  93%|#########2| 88/95 [01:01<00:05,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9614, LAS: 0.9255, UEM: 0.6705, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0890, partial_loss/deprel_loss: 0.2279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3958, loss: 0.5836, batch_reg_loss: 0.1956, reg_loss: 0.1958 ||:  96%|#########5| 91/95 [01:03<00:03,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9613, LAS: 0.9255, UEM: 0.6654, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3783, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5791, loss: 0.5830, batch_reg_loss: 0.1956, reg_loss: 0.1958 ||: 100%|##########| 95/95 [01:05<00:00,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9613, LAS: 0.9255, UEM: 0.6654, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3783, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5791, loss: 0.5830, batch_reg_loss: 0.1956, reg_loss: 0.1958 ||: 100%|##########| 95/95 [01:05<00:00,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.196  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - UEM                      |     0.665  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - LEM                      |     0.440  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - EM                       |     0.918  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.378  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:35:03,848 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.385  |       N/A\n",
+      "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - loss                     |     0.583  |       N/A\n",
+      "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - LAS                      |     0.925  |       N/A\n",
+      "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:35:03,849 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:35:03,853 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:35:08,540 - INFO - combo.training.trainer - Epoch duration: 0:01:13.347534\n",
+      "2023-04-07 01:35:08,540 - INFO - combo.training.trainer - Estimated training time remaining: 4:54:17\n",
+      "2023-04-07 01:35:08,541 - INFO - allennlp.training.trainer - Epoch 144/399\n",
+      "2023-04-07 01:35:08,541 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:35:08,542 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:35:08,551 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9723, LAS: 0.9370, UEM: 0.7976, LEM: 0.5757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1629, partial_loss/deprel_loss: 0.3034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4709, loss: 0.5066, batch_reg_loss: 0.1956, reg_loss: 0.1956 ||:   5%|5         | 5/95 [00:02<00:47,  1.91it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9633, LAS: 0.9280, UEM: 0.7085, LEM: 0.4923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5152, partial_loss/deprel_loss: 0.4897, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6904, loss: 0.5663, batch_reg_loss: 0.1956, reg_loss: 0.1956 ||:   9%|9         | 9/95 [00:05<00:47,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9630, LAS: 0.9273, UEM: 0.6953, LEM: 0.4721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5477, partial_loss/deprel_loss: 0.5254, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7254, loss: 0.5694, batch_reg_loss: 0.1956, reg_loss: 0.1956 ||:  13%|#2        | 12/95 [00:07<00:49,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9614, LAS: 0.9258, UEM: 0.6516, LEM: 0.4257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3085, partial_loss/deprel_loss: 0.3481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5357, loss: 0.5813, batch_reg_loss: 0.1956, reg_loss: 0.1956 ||:  17%|#6        | 16/95 [00:09<00:46,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9621, LAS: 0.9269, UEM: 0.6642, LEM: 0.4458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5289, partial_loss/deprel_loss: 0.4735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6802, loss: 0.5716, batch_reg_loss: 0.1956, reg_loss: 0.1956 ||:  20%|##        | 19/95 [00:11<00:47,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9613, LAS: 0.9260, UEM: 0.6528, LEM: 0.4331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6241, partial_loss/deprel_loss: 0.5382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7509, loss: 0.5783, batch_reg_loss: 0.1955, reg_loss: 0.1956 ||:  24%|##4       | 23/95 [00:13<00:42,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9623, LAS: 0.9268, UEM: 0.6690, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1259, partial_loss/deprel_loss: 0.3156, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4732, loss: 0.5720, batch_reg_loss: 0.1955, reg_loss: 0.1956 ||:  28%|##8       | 27/95 [00:15<00:39,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9232, UAS: 0.9632, LAS: 0.9280, UEM: 0.6748, LEM: 0.4500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2753, partial_loss/deprel_loss: 0.3965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5678, loss: 0.5657, batch_reg_loss: 0.1955, reg_loss: 0.1956 ||:  34%|###3      | 32/95 [00:18<00:34,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9645, LAS: 0.9294, UEM: 0.6863, LEM: 0.4595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1585, partial_loss/deprel_loss: 0.2794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4508, loss: 0.5558, batch_reg_loss: 0.1955, reg_loss: 0.1956 ||:  38%|###7      | 36/95 [00:20<00:31,  1.86it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9647, LAS: 0.9295, UEM: 0.6900, LEM: 0.4613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3195, partial_loss/deprel_loss: 0.3555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5438, loss: 0.5537, batch_reg_loss: 0.1955, reg_loss: 0.1956 ||:  42%|####2     | 40/95 [00:23<00:32,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9224, UAS: 0.9651, LAS: 0.9299, UEM: 0.6876, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3535, partial_loss/deprel_loss: 0.3828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5724, loss: 0.5509, batch_reg_loss: 0.1955, reg_loss: 0.1955 ||:  46%|####6     | 44/95 [00:25<00:31,  1.64it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9651, LAS: 0.9301, UEM: 0.7024, LEM: 0.4781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8110, partial_loss/deprel_loss: 0.5529, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8000, loss: 0.5480, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||:  51%|#####     | 48/95 [00:28<00:31,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9646, LAS: 0.9293, UEM: 0.6907, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5458, partial_loss/deprel_loss: 0.4938, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6996, loss: 0.5549, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||:  55%|#####4    | 52/95 [00:31<00:28,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9645, LAS: 0.9294, UEM: 0.6857, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1897, partial_loss/deprel_loss: 0.3450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5094, loss: 0.5570, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||:  59%|#####8    | 56/95 [00:34<00:26,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9640, LAS: 0.9288, UEM: 0.6758, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.3294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5331, loss: 0.5605, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||:  62%|######2   | 59/95 [00:36<00:25,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9634, LAS: 0.9284, UEM: 0.6720, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5894, partial_loss/deprel_loss: 0.5012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7142, loss: 0.5645, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||:  65%|######5   | 62/95 [00:39<00:23,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9638, LAS: 0.9287, UEM: 0.6787, LEM: 0.4522, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1116, partial_loss/deprel_loss: 0.2341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4050, loss: 0.5608, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||:  68%|######8   | 65/95 [00:41<00:21,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9633, LAS: 0.9283, UEM: 0.6693, LEM: 0.4418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3070, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5677, loss: 0.5637, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||:  73%|#######2  | 69/95 [00:43<00:17,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9629, LAS: 0.9280, UEM: 0.6674, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7485, partial_loss/deprel_loss: 0.4514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7062, loss: 0.5651, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||:  76%|#######5  | 72/95 [00:45<00:16,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9617, LAS: 0.9269, UEM: 0.6596, LEM: 0.4359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3724, partial_loss/deprel_loss: 0.3970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.5729, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||:  79%|#######8  | 75/95 [00:48<00:14,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9619, LAS: 0.9271, UEM: 0.6603, LEM: 0.4343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3534, partial_loss/deprel_loss: 0.4346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.5717, batch_reg_loss: 0.1954, reg_loss: 0.1955 ||:  82%|########2 | 78/95 [00:50<00:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9615, LAS: 0.9268, UEM: 0.6553, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2096, partial_loss/deprel_loss: 0.2869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4668, loss: 0.5751, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||:  86%|########6 | 82/95 [00:52<00:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9740, UAS: 0.9619, LAS: 0.9272, UEM: 0.6680, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0249, partial_loss/deprel_loss: 0.1024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2823, loss: 0.5727, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||:  89%|########9 | 85/95 [00:55<00:07,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9620, LAS: 0.9273, UEM: 0.6675, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2200, partial_loss/deprel_loss: 0.3466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5166, loss: 0.5713, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||:  93%|#########2| 88/95 [00:57<00:05,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8677, UAS: 0.9617, LAS: 0.9269, UEM: 0.6699, LEM: 0.4487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1521, partial_loss/deprel_loss: 0.6569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9512, loss: 0.5735, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||:  96%|#########5| 91/95 [00:59<00:02,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9613, LAS: 0.9264, UEM: 0.6673, LEM: 0.4460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5637, partial_loss/deprel_loss: 0.4601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6761, loss: 0.5766, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||:  99%|#########8| 94/95 [01:01<00:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9610, LAS: 0.9261, UEM: 0.6648, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8027, partial_loss/deprel_loss: 0.5686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8107, loss: 0.5790, batch_reg_loss: 0.1953, reg_loss: 0.1955 ||: 100%|##########| 95/95 [01:02<00:00,  1.53it/s]\n",
+      "2023-04-07 01:36:13,968 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.195  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - UEM                      |     0.665  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - LEM                      |     0.444  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - EM                       |     0.896  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.803  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:36:13,969 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.569  |       N/A\n",
+      "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - loss                     |     0.579  |       N/A\n",
+      "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - LAS                      |     0.926  |       N/A\n",
+      "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:36:13,970 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:36:13,975 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:36:18,797 - INFO - combo.training.trainer - Epoch duration: 0:01:10.256214\n",
+      "2023-04-07 01:36:18,797 - INFO - combo.training.trainer - Estimated training time remaining: 4:53:10\n",
+      "2023-04-07 01:36:18,797 - INFO - allennlp.training.trainer - Epoch 145/399\n",
+      "2023-04-07 01:36:18,798 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:36:18,798 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:36:18,805 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9674, LAS: 0.9300, UEM: 0.6255, LEM: 0.3333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3173, partial_loss/deprel_loss: 0.3076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5049, loss: 0.5278, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||:   3%|3         | 3/95 [00:02<01:06,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9622, LAS: 0.9265, UEM: 0.5693, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5101, partial_loss/deprel_loss: 0.4328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6435, loss: 0.5750, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||:   6%|6         | 6/95 [00:04<01:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9651, LAS: 0.9292, UEM: 0.6349, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4242, partial_loss/deprel_loss: 0.4547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6439, loss: 0.5553, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||:   9%|9         | 9/95 [00:06<01:01,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9640, LAS: 0.9284, UEM: 0.6207, LEM: 0.3657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2163, partial_loss/deprel_loss: 0.3321, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5042, loss: 0.5611, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||:  14%|#3        | 13/95 [00:09<00:58,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9604, LAS: 0.9250, UEM: 0.5805, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2846, partial_loss/deprel_loss: 0.3570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5378, loss: 0.5831, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||:  18%|#7        | 17/95 [00:11<00:53,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9618, LAS: 0.9270, UEM: 0.6036, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4053, partial_loss/deprel_loss: 0.4630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6467, loss: 0.5713, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||:  21%|##1       | 20/95 [00:13<00:52,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9616, LAS: 0.9270, UEM: 0.6131, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2207, partial_loss/deprel_loss: 0.3642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5308, loss: 0.5725, batch_reg_loss: 0.1953, reg_loss: 0.1953 ||:  24%|##4       | 23/95 [00:16<00:53,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9614, LAS: 0.9270, UEM: 0.6195, LEM: 0.3757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7586, partial_loss/deprel_loss: 0.5081, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7535, loss: 0.5743, batch_reg_loss: 0.1952, reg_loss: 0.1953 ||:  27%|##7       | 26/95 [00:18<00:50,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9593, LAS: 0.9252, UEM: 0.5982, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5271, partial_loss/deprel_loss: 0.4619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6701, loss: 0.5885, batch_reg_loss: 0.1952, reg_loss: 0.1953 ||:  32%|###1      | 30/95 [00:20<00:44,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9583, LAS: 0.9241, UEM: 0.5792, LEM: 0.3428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5811, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6633, loss: 0.5922, batch_reg_loss: 0.1952, reg_loss: 0.1953 ||:  37%|###6      | 35/95 [00:23<00:37,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9590, LAS: 0.9250, UEM: 0.5971, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3866, partial_loss/deprel_loss: 0.4137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.5853, batch_reg_loss: 0.1952, reg_loss: 0.1953 ||:  42%|####2     | 40/95 [00:25<00:31,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9360, UAS: 0.9598, LAS: 0.9258, UEM: 0.6005, LEM: 0.3642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2454, partial_loss/deprel_loss: 0.3137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4953, loss: 0.5803, batch_reg_loss: 0.1952, reg_loss: 0.1953 ||:  47%|####7     | 45/95 [00:27<00:26,  1.90it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9589, LAS: 0.9247, UEM: 0.6081, LEM: 0.3712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1542, partial_loss/deprel_loss: 0.3116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4753, loss: 0.5880, batch_reg_loss: 0.1952, reg_loss: 0.1952 ||:  52%|#####1    | 49/95 [00:29<00:24,  1.91it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9588, LAS: 0.9248, UEM: 0.6300, LEM: 0.4076, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0358, partial_loss/deprel_loss: 0.1138, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2934, loss: 0.5870, batch_reg_loss: 0.1952, reg_loss: 0.1952 ||:  56%|#####5    | 53/95 [00:32<00:23,  1.77it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9597, LAS: 0.9255, UEM: 0.6463, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 0.2376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4136, loss: 0.5811, batch_reg_loss: 0.1952, reg_loss: 0.1952 ||:  60%|######    | 57/95 [00:35<00:23,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9256, UAS: 0.9604, LAS: 0.9261, UEM: 0.6547, LEM: 0.4304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3106, partial_loss/deprel_loss: 0.3452, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5334, loss: 0.5771, batch_reg_loss: 0.1952, reg_loss: 0.1952 ||:  64%|######4   | 61/95 [00:38<00:22,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9610, LAS: 0.9265, UEM: 0.6585, LEM: 0.4316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1048, partial_loss/deprel_loss: 0.2579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4224, loss: 0.5743, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||:  68%|######8   | 65/95 [00:41<00:20,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9617, LAS: 0.9271, UEM: 0.6651, LEM: 0.4340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2053, partial_loss/deprel_loss: 0.2998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4761, loss: 0.5705, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||:  73%|#######2  | 69/95 [00:44<00:17,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8759, UAS: 0.9602, LAS: 0.9255, UEM: 0.6554, LEM: 0.4257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0145, partial_loss/deprel_loss: 0.6211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8949, loss: 0.5812, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||:  77%|#######6  | 73/95 [00:46<00:14,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9605, LAS: 0.9257, UEM: 0.6660, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1002, partial_loss/deprel_loss: 0.1881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3656, loss: 0.5797, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||:  81%|########1 | 77/95 [00:49<00:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9605, LAS: 0.9256, UEM: 0.6679, LEM: 0.4412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1022, partial_loss/deprel_loss: 0.2672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4293, loss: 0.5810, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||:  84%|########4 | 80/95 [00:52<00:10,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9605, LAS: 0.9255, UEM: 0.6646, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1667, partial_loss/deprel_loss: 0.3177, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4826, loss: 0.5823, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||:  87%|########7 | 83/95 [00:54<00:08,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9604, LAS: 0.9253, UEM: 0.6573, LEM: 0.4298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3819, partial_loss/deprel_loss: 0.4149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6033, loss: 0.5847, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||:  92%|#########1| 87/95 [00:56<00:05,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9609, LAS: 0.9258, UEM: 0.6642, LEM: 0.4361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1931, partial_loss/deprel_loss: 0.3149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4856, loss: 0.5812, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||:  96%|#########5| 91/95 [00:59<00:02,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9611, LAS: 0.9259, UEM: 0.6668, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1362, partial_loss/deprel_loss: 0.3189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4774, loss: 0.5804, batch_reg_loss: 0.1951, reg_loss: 0.1952 ||:  99%|#########8| 94/95 [01:01<00:00,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9612, LAS: 0.9261, UEM: 0.6660, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2646, partial_loss/deprel_loss: 0.2843, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4754, loss: 0.5793, batch_reg_loss: 0.1950, reg_loss: 0.1952 ||: 100%|##########| 95/95 [01:02<00:00,  1.52it/s]\n",
+      "2023-04-07 01:37:24,348 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8625, UAS: 0.9470, LAS: 0.9012, UEM: 0.8096, LEM: 0.6413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5334, partial_loss/deprel_loss: 19.5984, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9854, loss: 10.0469, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  18%|#8        | 2/11 [00:02<00:10,  1.20s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9530, LAS: 0.9044, UEM: 0.7198, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8728, partial_loss/deprel_loss: 10.5768, partial_loss/cycle_loss: 0.0000, batch_loss: 8.6360, loss: 8.1821, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:06,  1.09s/it]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9476, LAS: 0.8963, UEM: 0.6564, LEM: 0.4009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2028, partial_loss/deprel_loss: 16.7362, partial_loss/cycle_loss: 0.0000, batch_loss: 13.6295, loss: 9.5178, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:07<00:04,  1.09s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9507, LAS: 0.8985, UEM: 0.6791, LEM: 0.3979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0512, partial_loss/deprel_loss: 9.3839, partial_loss/cycle_loss: 0.0000, batch_loss: 7.7174, loss: 8.5489, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:09<00:01,  1.05s/it] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9523, LAS: 0.9007, UEM: 0.6903, LEM: 0.4069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4198, partial_loss/deprel_loss: 6.3904, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1963, loss: 8.2441, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.02it/s]\n",
+      "2023-04-07 01:37:35,130 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.195  |     0.000\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - UEM                      |     0.666  |     0.690\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - LEM                      |     0.437  |     0.407\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - EM                       |     0.940  |     0.923\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.265  |     0.420\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |     0.952\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.284  |     6.390\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - loss                     |     0.579  |     8.244\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:37:35,131 - INFO - combo.training.tensorboard_writer - LAS                      |     0.926  |     0.901\n",
+      "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:37:35,132 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:37:35,137 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:37:39,900 - INFO - combo.training.trainer - Epoch duration: 0:01:21.102822\n",
+      "2023-04-07 01:37:39,901 - INFO - combo.training.trainer - Estimated training time remaining: 4:52:22\n",
+      "2023-04-07 01:37:39,901 - INFO - allennlp.training.trainer - Epoch 146/399\n",
+      "2023-04-07 01:37:39,905 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:37:39,906 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:37:39,913 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9768, LAS: 0.9408, UEM: 0.8439, LEM: 0.6231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1214, partial_loss/deprel_loss: 0.2641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4306, loss: 0.4573, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||:   3%|3         | 3/95 [00:02<01:18,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9656, LAS: 0.9303, UEM: 0.7362, LEM: 0.5173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2008, partial_loss/deprel_loss: 0.2163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4082, loss: 0.5202, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||:   7%|7         | 7/95 [00:05<01:10,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9653, LAS: 0.9298, UEM: 0.7205, LEM: 0.4919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2149, partial_loss/deprel_loss: 0.3451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.5366, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||:  11%|#         | 10/95 [00:07<01:07,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9148, UAS: 0.9647, LAS: 0.9291, UEM: 0.7005, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5481, partial_loss/deprel_loss: 0.4620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6742, loss: 0.5476, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||:  14%|#3        | 13/95 [00:09<01:02,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9629, LAS: 0.9284, UEM: 0.6838, LEM: 0.4520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2093, partial_loss/deprel_loss: 0.2970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4745, loss: 0.5543, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||:  18%|#7        | 17/95 [00:12<00:57,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9323, UAS: 0.9616, LAS: 0.9267, UEM: 0.6563, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2811, partial_loss/deprel_loss: 0.3698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5471, loss: 0.5677, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||:  21%|##1       | 20/95 [00:14<00:54,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9622, LAS: 0.9272, UEM: 0.6612, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4932, partial_loss/deprel_loss: 0.4835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6804, loss: 0.5689, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||:  25%|##5       | 24/95 [00:16<00:49,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9633, LAS: 0.9285, UEM: 0.6871, LEM: 0.4649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6006, partial_loss/deprel_loss: 0.4472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6728, loss: 0.5618, batch_reg_loss: 0.1950, reg_loss: 0.1950 ||:  28%|##8       | 27/95 [00:18<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9643, LAS: 0.9289, UEM: 0.6968, LEM: 0.4663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1564, partial_loss/deprel_loss: 0.3049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4702, loss: 0.5555, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||:  32%|###1      | 30/95 [00:21<00:45,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9625, LAS: 0.9271, UEM: 0.6957, LEM: 0.4706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9823, partial_loss/deprel_loss: 0.5650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8434, loss: 0.5663, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||:  36%|###5      | 34/95 [00:23<00:39,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9458, UAS: 0.9636, LAS: 0.9282, UEM: 0.6939, LEM: 0.4637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1359, partial_loss/deprel_loss: 0.2753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4423, loss: 0.5609, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||:  41%|####1     | 39/95 [00:25<00:33,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9639, LAS: 0.9289, UEM: 0.6881, LEM: 0.4583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1559, partial_loss/deprel_loss: 0.3300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4901, loss: 0.5559, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||:  46%|####6     | 44/95 [00:27<00:27,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9631, LAS: 0.9280, UEM: 0.6779, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4824, partial_loss/deprel_loss: 0.4924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6853, loss: 0.5623, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||:  52%|#####1    | 49/95 [00:30<00:24,  1.85it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9618, LAS: 0.9267, UEM: 0.6693, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2899, partial_loss/deprel_loss: 0.3352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5210, loss: 0.5714, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||:  56%|#####5    | 53/95 [00:33<00:24,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9617, LAS: 0.9264, UEM: 0.6631, LEM: 0.4334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3949, partial_loss/deprel_loss: 0.4529, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6362, loss: 0.5723, batch_reg_loss: 0.1949, reg_loss: 0.1950 ||:  60%|######    | 57/95 [00:35<00:21,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9621, LAS: 0.9268, UEM: 0.6765, LEM: 0.4561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5192, partial_loss/deprel_loss: 0.5042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7021, loss: 0.5705, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||:  64%|######4   | 61/95 [00:38<00:21,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9621, LAS: 0.9267, UEM: 0.6761, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4551, partial_loss/deprel_loss: 0.4019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6074, loss: 0.5689, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||:  68%|######8   | 65/95 [00:41<00:20,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9622, LAS: 0.9267, UEM: 0.6769, LEM: 0.4554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6631, partial_loss/deprel_loss: 0.5134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7382, loss: 0.5699, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||:  73%|#######2  | 69/95 [00:44<00:17,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9615, LAS: 0.9261, UEM: 0.6703, LEM: 0.4496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4632, partial_loss/deprel_loss: 0.3933, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6021, loss: 0.5745, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||:  76%|#######5  | 72/95 [00:46<00:15,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9336, UAS: 0.9615, LAS: 0.9261, UEM: 0.6662, LEM: 0.4440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2535, partial_loss/deprel_loss: 0.3747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5453, loss: 0.5748, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||:  79%|#######8  | 75/95 [00:48<00:13,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9614, LAS: 0.9259, UEM: 0.6647, LEM: 0.4418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2812, partial_loss/deprel_loss: 0.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5207, loss: 0.5753, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||:  83%|########3 | 79/95 [00:50<00:10,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9616, LAS: 0.9261, UEM: 0.6633, LEM: 0.4397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2467, partial_loss/deprel_loss: 0.2803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4684, loss: 0.5736, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||:  87%|########7 | 83/95 [00:53<00:07,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9613, LAS: 0.9258, UEM: 0.6611, LEM: 0.4375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5645, partial_loss/deprel_loss: 0.4562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6726, loss: 0.5760, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||:  92%|#########1| 87/95 [00:55<00:05,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9615, LAS: 0.9260, UEM: 0.6667, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8177, partial_loss/deprel_loss: 0.6482, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8769, loss: 0.5753, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||:  96%|#########5| 91/95 [00:58<00:02,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9611, LAS: 0.9257, UEM: 0.6636, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7940, partial_loss/deprel_loss: 0.4946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7492, loss: 0.5771, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 100%|##########| 95/95 [01:01<00:00,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9611, LAS: 0.9257, UEM: 0.6636, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7940, partial_loss/deprel_loss: 0.4946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7492, loss: 0.5771, batch_reg_loss: 0.1948, reg_loss: 0.1949 ||: 100%|##########| 95/95 [01:01<00:00,  1.55it/s]\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.195  |       N/A\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - UEM                      |     0.664  |       N/A\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - LEM                      |     0.442  |       N/A\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - EM                       |     0.905  |       N/A\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.794  |       N/A\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:38:44,417 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
+      "2023-04-07 01:38:44,418 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:38:44,418 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.495  |       N/A\n",
+      "2023-04-07 01:38:44,418 - INFO - combo.training.tensorboard_writer - loss                     |     0.577  |       N/A\n",
+      "2023-04-07 01:38:44,418 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:38:44,418 - INFO - combo.training.tensorboard_writer - LAS                      |     0.926  |       N/A\n",
+      "2023-04-07 01:38:44,418 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:38:44,419 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:38:44,419 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:38:44,419 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:38:44,419 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:38:44,419 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:38:44,424 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:38:49,391 - INFO - combo.training.trainer - Epoch duration: 0:01:09.489946\n",
+      "2023-04-07 01:38:49,391 - INFO - combo.training.trainer - Estimated training time remaining: 4:51:14\n",
+      "2023-04-07 01:38:49,391 - INFO - allennlp.training.trainer - Epoch 147/399\n",
+      "2023-04-07 01:38:49,392 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:38:49,392 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:38:49,401 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9700, LAS: 0.9320, UEM: 0.8024, LEM: 0.5889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0914, partial_loss/deprel_loss: 0.2178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3873, loss: 0.5235, batch_reg_loss: 0.1948, reg_loss: 0.1948 ||:   3%|3         | 3/95 [00:02<01:16,  1.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9558, LAS: 0.9185, UEM: 0.7202, LEM: 0.4936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4417, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6787, loss: 0.6081, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||:   6%|6         | 6/95 [00:04<01:13,  1.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9308, UAS: 0.9608, LAS: 0.9236, UEM: 0.7109, LEM: 0.4619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3048, partial_loss/deprel_loss: 0.3805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5601, loss: 0.5829, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||:   9%|9         | 9/95 [00:07<01:08,  1.25it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9461, UAS: 0.9621, LAS: 0.9253, UEM: 0.7227, LEM: 0.4816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1072, partial_loss/deprel_loss: 0.2442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4116, loss: 0.5705, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||:  13%|#2        | 12/95 [00:09<01:03,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9590, LAS: 0.9226, UEM: 0.6710, LEM: 0.4354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5053, partial_loss/deprel_loss: 0.4594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6633, loss: 0.5941, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||:  17%|#6        | 16/95 [00:11<00:57,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9601, LAS: 0.9239, UEM: 0.6670, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3350, partial_loss/deprel_loss: 0.3966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5790, loss: 0.5888, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||:  21%|##1       | 20/95 [00:14<00:51,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9612, LAS: 0.9254, UEM: 0.6634, LEM: 0.4235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4431, partial_loss/deprel_loss: 0.4889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6745, loss: 0.5834, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||:  25%|##5       | 24/95 [00:16<00:47,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8743, UAS: 0.9598, LAS: 0.9239, UEM: 0.6607, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0689, partial_loss/deprel_loss: 0.6764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9496, loss: 0.5918, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||:  29%|##9       | 28/95 [00:18<00:42,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9590, LAS: 0.9234, UEM: 0.6451, LEM: 0.4120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2733, partial_loss/deprel_loss: 0.3431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5238, loss: 0.5965, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||:  34%|###3      | 32/95 [00:20<00:37,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9580, LAS: 0.9230, UEM: 0.6245, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3928, partial_loss/deprel_loss: 0.3778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5755, loss: 0.6015, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||:  38%|###7      | 36/95 [00:23<00:36,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9593, LAS: 0.9242, UEM: 0.6439, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1932, partial_loss/deprel_loss: 0.2998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4732, loss: 0.5942, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||:  42%|####2     | 40/95 [00:26<00:35,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9601, LAS: 0.9250, UEM: 0.6481, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2105, partial_loss/deprel_loss: 0.3241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4961, loss: 0.5866, batch_reg_loss: 0.1947, reg_loss: 0.1947 ||:  46%|####6     | 44/95 [00:28<00:32,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9606, LAS: 0.9257, UEM: 0.6478, LEM: 0.4152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5097, partial_loss/deprel_loss: 0.4705, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6730, loss: 0.5840, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||:  51%|#####     | 48/95 [00:31<00:31,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9613, LAS: 0.9265, UEM: 0.6749, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1654, partial_loss/deprel_loss: 0.2774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4497, loss: 0.5765, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||:  55%|#####4    | 52/95 [00:35<00:30,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9494, UAS: 0.9619, LAS: 0.9270, UEM: 0.6761, LEM: 0.4528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1565, partial_loss/deprel_loss: 0.2634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4366, loss: 0.5739, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||:  60%|######    | 57/95 [00:37<00:24,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9621, LAS: 0.9269, UEM: 0.6679, LEM: 0.4428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4023, partial_loss/deprel_loss: 0.4833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6617, loss: 0.5763, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||:  65%|######5   | 62/95 [00:39<00:19,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9616, LAS: 0.9263, UEM: 0.6622, LEM: 0.4380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4189, partial_loss/deprel_loss: 0.4651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6504, loss: 0.5801, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||:  71%|#######   | 67/95 [00:41<00:15,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9609, LAS: 0.9256, UEM: 0.6548, LEM: 0.4306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3425, partial_loss/deprel_loss: 0.3956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5795, loss: 0.5847, batch_reg_loss: 0.1946, reg_loss: 0.1947 ||:  75%|#######4  | 71/95 [00:44<00:13,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9612, LAS: 0.9259, UEM: 0.6641, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6663, partial_loss/deprel_loss: 0.5419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7613, loss: 0.5817, batch_reg_loss: 0.1945, reg_loss: 0.1947 ||:  79%|#######8  | 75/95 [00:49<00:15,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9612, LAS: 0.9259, UEM: 0.6713, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9395, partial_loss/deprel_loss: 0.6295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8860, loss: 0.5815, batch_reg_loss: 0.1945, reg_loss: 0.1947 ||:  83%|########3 | 79/95 [00:52<00:12,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9617, LAS: 0.9264, UEM: 0.6751, LEM: 0.4529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1674, partial_loss/deprel_loss: 0.2679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4423, loss: 0.5777, batch_reg_loss: 0.1945, reg_loss: 0.1946 ||:  86%|########6 | 82/95 [00:54<00:09,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9615, LAS: 0.9262, UEM: 0.6700, LEM: 0.4482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4818, partial_loss/deprel_loss: 0.4349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6388, loss: 0.5791, batch_reg_loss: 0.1945, reg_loss: 0.1946 ||:  89%|########9 | 85/95 [00:56<00:07,  1.32it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9614, LAS: 0.9261, UEM: 0.6673, LEM: 0.4444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1892, partial_loss/deprel_loss: 0.3540, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5155, loss: 0.5804, batch_reg_loss: 0.1945, reg_loss: 0.1946 ||:  94%|#########3| 89/95 [00:59<00:04,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9614, LAS: 0.9261, UEM: 0.6708, LEM: 0.4493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3842, partial_loss/deprel_loss: 0.4363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6203, loss: 0.5801, batch_reg_loss: 0.1945, reg_loss: 0.1946 ||:  97%|#########6| 92/95 [01:01<00:02,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9613, LAS: 0.9259, UEM: 0.6690, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2026, partial_loss/deprel_loss: 0.3294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4985, loss: 0.5819, batch_reg_loss: 0.1945, reg_loss: 0.1946 ||: 100%|##########| 95/95 [01:03<00:00,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9613, LAS: 0.9259, UEM: 0.6690, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2026, partial_loss/deprel_loss: 0.3294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4985, loss: 0.5819, batch_reg_loss: 0.1945, reg_loss: 0.1946 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-07 01:39:56,277 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:39:56,277 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.195  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - UEM                      |     0.669  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - LEM                      |     0.447  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - EM                       |     0.927  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.203  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.329  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - loss                     |     0.582  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - LAS                      |     0.926  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:39:56,278 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:39:56,279 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:39:56,279 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:39:56,279 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:39:56,284 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:40:02,411 - INFO - combo.training.trainer - Epoch duration: 0:01:13.019938\n",
+      "2023-04-07 01:40:02,412 - INFO - combo.training.trainer - Estimated training time remaining: 4:50:12\n",
+      "2023-04-07 01:40:02,413 - INFO - allennlp.training.trainer - Epoch 148/399\n",
+      "2023-04-07 01:40:02,413 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:40:02,413 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:40:02,420 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9744, LAS: 0.9410, UEM: 0.7404, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1520, partial_loss/deprel_loss: 0.2852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4530, loss: 0.4921, batch_reg_loss: 0.1945, reg_loss: 0.1945 ||:   3%|3         | 3/95 [00:02<01:05,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9688, LAS: 0.9367, UEM: 0.6836, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1890, partial_loss/deprel_loss: 0.2594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4398, loss: 0.5078, batch_reg_loss: 0.1945, reg_loss: 0.1945 ||:   7%|7         | 7/95 [00:04<00:59,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8783, UAS: 0.9651, LAS: 0.9312, UEM: 0.7144, LEM: 0.4688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0441, partial_loss/deprel_loss: 0.6488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9223, loss: 0.5370, batch_reg_loss: 0.1945, reg_loss: 0.1945 ||:  11%|#         | 10/95 [00:07<01:02,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9626, LAS: 0.9289, UEM: 0.6773, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3531, partial_loss/deprel_loss: 0.4054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5894, loss: 0.5538, batch_reg_loss: 0.1944, reg_loss: 0.1945 ||:  14%|#3        | 13/95 [00:09<00:59,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9644, LAS: 0.9311, UEM: 0.7024, LEM: 0.4640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1947, partial_loss/deprel_loss: 0.2653, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4456, loss: 0.5368, batch_reg_loss: 0.1944, reg_loss: 0.1945 ||:  17%|#6        | 16/95 [00:11<01:00,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9351, UAS: 0.9654, LAS: 0.9322, UEM: 0.6880, LEM: 0.4464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2423, partial_loss/deprel_loss: 0.3128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4931, loss: 0.5309, batch_reg_loss: 0.1944, reg_loss: 0.1945 ||:  21%|##1       | 20/95 [00:14<00:53,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9655, LAS: 0.9318, UEM: 0.6834, LEM: 0.4356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2004, partial_loss/deprel_loss: 0.3251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4945, loss: 0.5338, batch_reg_loss: 0.1944, reg_loss: 0.1944 ||:  25%|##5       | 24/95 [00:16<00:47,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9496, UAS: 0.9652, LAS: 0.9317, UEM: 0.6777, LEM: 0.4352, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1851, partial_loss/deprel_loss: 0.2392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4228, loss: 0.5354, batch_reg_loss: 0.1944, reg_loss: 0.1944 ||:  28%|##8       | 27/95 [00:18<00:46,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9654, LAS: 0.9316, UEM: 0.6774, LEM: 0.4347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4127, partial_loss/deprel_loss: 0.4125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6069, loss: 0.5384, batch_reg_loss: 0.1944, reg_loss: 0.1944 ||:  32%|###1      | 30/95 [00:20<00:44,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9659, LAS: 0.9320, UEM: 0.6825, LEM: 0.4370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3103, partial_loss/deprel_loss: 0.4138, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5875, loss: 0.5368, batch_reg_loss: 0.1944, reg_loss: 0.1944 ||:  35%|###4      | 33/95 [00:22<00:42,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8819, UAS: 0.9649, LAS: 0.9308, UEM: 0.6832, LEM: 0.4376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2323, partial_loss/deprel_loss: 0.5903, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9130, loss: 0.5444, batch_reg_loss: 0.1944, reg_loss: 0.1944 ||:  38%|###7      | 36/95 [00:24<00:40,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9635, LAS: 0.9291, UEM: 0.6664, LEM: 0.4232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7926, partial_loss/deprel_loss: 0.5206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7694, loss: 0.5546, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||:  42%|####2     | 40/95 [00:27<00:36,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9509, UAS: 0.9640, LAS: 0.9295, UEM: 0.6878, LEM: 0.4542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0724, partial_loss/deprel_loss: 0.1789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3519, loss: 0.5502, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||:  46%|####6     | 44/95 [00:30<00:35,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9631, LAS: 0.9284, UEM: 0.6779, LEM: 0.4454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2713, partial_loss/deprel_loss: 0.3649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5405, loss: 0.5579, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||:  49%|####9     | 47/95 [00:32<00:34,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9623, LAS: 0.9276, UEM: 0.6673, LEM: 0.4331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2135, partial_loss/deprel_loss: 0.3543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5204, loss: 0.5629, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||:  54%|#####3    | 51/95 [00:35<00:30,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9622, LAS: 0.9275, UEM: 0.6637, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5394, partial_loss/deprel_loss: 0.4958, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6988, loss: 0.5639, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||:  57%|#####6    | 54/95 [00:37<00:28,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9625, LAS: 0.9277, UEM: 0.6680, LEM: 0.4336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1957, partial_loss/deprel_loss: 0.2777, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4556, loss: 0.5613, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||:  61%|######1   | 58/95 [00:39<00:25,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9500, UAS: 0.9631, LAS: 0.9283, UEM: 0.6834, LEM: 0.4509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0752, partial_loss/deprel_loss: 0.2441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4046, loss: 0.5568, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||:  64%|######4   | 61/95 [00:42<00:23,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9616, LAS: 0.9267, UEM: 0.6699, LEM: 0.4399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8370, partial_loss/deprel_loss: 0.5899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8336, loss: 0.5667, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||:  68%|######8   | 65/95 [00:44<00:20,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9619, LAS: 0.9273, UEM: 0.6804, LEM: 0.4598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0577, partial_loss/deprel_loss: 0.1130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2962, loss: 0.5648, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||:  74%|#######3  | 70/95 [00:47<00:15,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9621, LAS: 0.9274, UEM: 0.6767, LEM: 0.4554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1719, partial_loss/deprel_loss: 0.2579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4349, loss: 0.5652, batch_reg_loss: 0.1943, reg_loss: 0.1944 ||:  79%|#######8  | 75/95 [00:49<00:11,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9623, LAS: 0.9276, UEM: 0.6764, LEM: 0.4531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6284, partial_loss/deprel_loss: 0.5133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7305, loss: 0.5645, batch_reg_loss: 0.1942, reg_loss: 0.1944 ||:  84%|########4 | 80/95 [00:51<00:08,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9615, LAS: 0.9268, UEM: 0.6698, LEM: 0.4466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5624, partial_loss/deprel_loss: 0.4455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6631, loss: 0.5706, batch_reg_loss: 0.1942, reg_loss: 0.1943 ||:  88%|########8 | 84/95 [00:55<00:06,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9619, LAS: 0.9270, UEM: 0.6704, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2817, partial_loss/deprel_loss: 0.4192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.5695, batch_reg_loss: 0.1942, reg_loss: 0.1943 ||:  93%|#########2| 88/95 [00:58<00:04,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9620, LAS: 0.9270, UEM: 0.6698, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6388, partial_loss/deprel_loss: 0.5363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7510, loss: 0.5693, batch_reg_loss: 0.1942, reg_loss: 0.1943 ||:  97%|#########6| 92/95 [01:01<00:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9618, LAS: 0.9268, UEM: 0.6647, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6035, partial_loss/deprel_loss: 0.5098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7227, loss: 0.5714, batch_reg_loss: 0.1942, reg_loss: 0.1943 ||: 100%|##########| 95/95 [01:03<00:00,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:41:08,690 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.194  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - UEM                      |     0.665  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - LEM                      |     0.438  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - EM                       |     0.908  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.603  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.510  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - loss                     |     0.571  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:41:08,691 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |       N/A\n",
+      "2023-04-07 01:41:08,692 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:41:08,692 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:41:08,692 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:41:08,692 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:41:08,692 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:41:08,692 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:41:08,697 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:41:13,618 - INFO - combo.training.trainer - Epoch duration: 0:01:11.205192\n",
+      "2023-04-07 01:41:13,618 - INFO - combo.training.trainer - Estimated training time remaining: 4:49:06\n",
+      "2023-04-07 01:41:13,618 - INFO - allennlp.training.trainer - Epoch 149/399\n",
+      "2023-04-07 01:41:13,618 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:41:13,619 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:41:13,628 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9614, LAS: 0.9257, UEM: 0.6583, LEM: 0.4530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1289, partial_loss/deprel_loss: 0.2566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4253, loss: 0.5710, batch_reg_loss: 0.1942, reg_loss: 0.1942 ||:   3%|3         | 3/95 [00:02<01:09,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9590, LAS: 0.9226, UEM: 0.5729, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4041, partial_loss/deprel_loss: 0.4479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6333, loss: 0.5999, batch_reg_loss: 0.1942, reg_loss: 0.1942 ||:   6%|6         | 6/95 [00:04<01:05,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9594, LAS: 0.9240, UEM: 0.5481, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4907, partial_loss/deprel_loss: 0.4389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6434, loss: 0.6039, batch_reg_loss: 0.1942, reg_loss: 0.1942 ||:   9%|9         | 9/95 [00:06<01:03,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9640, LAS: 0.9293, UEM: 0.6384, LEM: 0.3999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1567, partial_loss/deprel_loss: 0.2807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4500, loss: 0.5638, batch_reg_loss: 0.1942, reg_loss: 0.1942 ||:  13%|#2        | 12/95 [00:08<01:02,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9641, LAS: 0.9295, UEM: 0.6795, LEM: 0.4486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2402, partial_loss/deprel_loss: 0.3336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5091, loss: 0.5631, batch_reg_loss: 0.1942, reg_loss: 0.1942 ||:  16%|#5        | 15/95 [00:11<00:59,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9641, LAS: 0.9299, UEM: 0.6658, LEM: 0.4330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4784, partial_loss/deprel_loss: 0.4553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6541, loss: 0.5623, batch_reg_loss: 0.1941, reg_loss: 0.1942 ||:  19%|#8        | 18/95 [00:13<00:56,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9486, UAS: 0.9644, LAS: 0.9301, UEM: 0.6699, LEM: 0.4357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1440, partial_loss/deprel_loss: 0.2600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4309, loss: 0.5605, batch_reg_loss: 0.1941, reg_loss: 0.1942 ||:  22%|##2       | 21/95 [00:15<00:55,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9627, LAS: 0.9285, UEM: 0.6464, LEM: 0.4167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4797, partial_loss/deprel_loss: 0.4261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6309, loss: 0.5696, batch_reg_loss: 0.1941, reg_loss: 0.1942 ||:  25%|##5       | 24/95 [00:17<00:52,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9632, LAS: 0.9292, UEM: 0.6490, LEM: 0.4152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2529, partial_loss/deprel_loss: 0.3305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5091, loss: 0.5631, batch_reg_loss: 0.1941, reg_loss: 0.1942 ||:  28%|##8       | 27/95 [00:19<00:50,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9637, LAS: 0.9297, UEM: 0.6502, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3560, partial_loss/deprel_loss: 0.3734, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5640, loss: 0.5609, batch_reg_loss: 0.1941, reg_loss: 0.1942 ||:  32%|###1      | 30/95 [00:22<00:47,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9633, LAS: 0.9293, UEM: 0.6401, LEM: 0.4038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2135, partial_loss/deprel_loss: 0.3372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.5665, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||:  35%|###4      | 33/95 [00:24<00:44,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9615, LAS: 0.9274, UEM: 0.6421, LEM: 0.4118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1411, partial_loss/deprel_loss: 0.2652, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4345, loss: 0.5764, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||:  38%|###7      | 36/95 [00:26<00:42,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9622, LAS: 0.9280, UEM: 0.6450, LEM: 0.4120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3323, partial_loss/deprel_loss: 0.3509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5412, loss: 0.5730, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||:  42%|####2     | 40/95 [00:28<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9625, LAS: 0.9282, UEM: 0.6431, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2572, partial_loss/deprel_loss: 0.3487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5244, loss: 0.5720, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||:  45%|####5     | 43/95 [00:30<00:36,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9626, LAS: 0.9281, UEM: 0.6375, LEM: 0.3997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1883, partial_loss/deprel_loss: 0.2949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4676, loss: 0.5702, batch_reg_loss: 0.1941, reg_loss: 0.1941 ||:  49%|####9     | 47/95 [00:33<00:32,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9620, LAS: 0.9276, UEM: 0.6397, LEM: 0.4051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1029, partial_loss/deprel_loss: 0.2344, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4021, loss: 0.5730, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||:  53%|#####2    | 50/95 [00:35<00:31,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9628, LAS: 0.9284, UEM: 0.6473, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2029, partial_loss/deprel_loss: 0.3205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4910, loss: 0.5673, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||:  56%|#####5    | 53/95 [00:37<00:29,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9627, LAS: 0.9284, UEM: 0.6482, LEM: 0.4126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1409, partial_loss/deprel_loss: 0.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4497, loss: 0.5673, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||:  59%|#####8    | 56/95 [00:40<00:28,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9618, LAS: 0.9274, UEM: 0.6350, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5930, partial_loss/deprel_loss: 0.5383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7432, loss: 0.5728, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||:  63%|######3   | 60/95 [00:42<00:24,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9623, LAS: 0.9279, UEM: 0.6453, LEM: 0.4129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2537, partial_loss/deprel_loss: 0.3706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5412, loss: 0.5693, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||:  66%|######6   | 63/95 [00:44<00:22,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9612, LAS: 0.9269, UEM: 0.6377, LEM: 0.4055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4288, partial_loss/deprel_loss: 0.4065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6049, loss: 0.5769, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||:  69%|######9   | 66/95 [00:47<00:21,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9612, LAS: 0.9269, UEM: 0.6398, LEM: 0.4071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2262, partial_loss/deprel_loss: 0.3117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.5758, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||:  73%|#######2  | 69/95 [00:49<00:19,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9622, LAS: 0.9279, UEM: 0.6668, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1521, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4982, loss: 0.5689, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||:  76%|#######5  | 72/95 [00:52<00:18,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9618, LAS: 0.9275, UEM: 0.6608, LEM: 0.4356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6352, partial_loss/deprel_loss: 0.4216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6583, loss: 0.5719, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||:  79%|#######8  | 75/95 [00:54<00:15,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9224, UAS: 0.9614, LAS: 0.9270, UEM: 0.6562, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3477, partial_loss/deprel_loss: 0.4311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6083, loss: 0.5751, batch_reg_loss: 0.1940, reg_loss: 0.1941 ||:  82%|########2 | 78/95 [00:56<00:12,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9616, UAS: 0.9613, LAS: 0.9269, UEM: 0.6668, LEM: 0.4448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0557, partial_loss/deprel_loss: 0.1716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3424, loss: 0.5738, batch_reg_loss: 0.1939, reg_loss: 0.1941 ||:  86%|########6 | 82/95 [00:58<00:09,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9614, LAS: 0.9270, UEM: 0.6651, LEM: 0.4404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2140, partial_loss/deprel_loss: 0.3683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5314, loss: 0.5739, batch_reg_loss: 0.1939, reg_loss: 0.1941 ||:  92%|#########1| 87/95 [01:01<00:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9620, LAS: 0.9275, UEM: 0.6744, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1524, partial_loss/deprel_loss: 0.2935, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4592, loss: 0.5696, batch_reg_loss: 0.1939, reg_loss: 0.1941 ||:  96%|#########5| 91/95 [01:04<00:02,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9619, LAS: 0.9274, UEM: 0.6710, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1426, partial_loss/deprel_loss: 0.3042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4658, loss: 0.5702, batch_reg_loss: 0.1939, reg_loss: 0.1940 ||: 100%|##########| 95/95 [01:06<00:00,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9619, LAS: 0.9274, UEM: 0.6710, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1426, partial_loss/deprel_loss: 0.3042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4658, loss: 0.5702, batch_reg_loss: 0.1939, reg_loss: 0.1940 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.194  |       N/A\n",
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - UEM                      |     0.671  |       N/A\n",
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - LEM                      |     0.445  |       N/A\n",
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - EM                       |     0.941  |       N/A\n",
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.143  |       N/A\n",
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:42:23,399 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.304  |       N/A\n",
+      "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - loss                     |     0.570  |       N/A\n",
+      "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |       N/A\n",
+      "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:42:23,400 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:42:23,405 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:42:30,545 - INFO - combo.training.trainer - Epoch duration: 0:01:16.926598\n",
+      "2023-04-07 01:42:30,545 - INFO - combo.training.trainer - Estimated training time remaining: 4:48:10\n",
+      "2023-04-07 01:42:30,546 - INFO - allennlp.training.trainer - Epoch 150/399\n",
+      "2023-04-07 01:42:30,546 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:42:30,547 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:42:30,557 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9660, LAS: 0.9301, UEM: 0.7472, LEM: 0.5735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5523, partial_loss/deprel_loss: 0.5159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7171, loss: 0.5174, batch_reg_loss: 0.1939, reg_loss: 0.1939 ||:   3%|3         | 3/95 [00:02<01:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9654, LAS: 0.9296, UEM: 0.7582, LEM: 0.5888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3937, partial_loss/deprel_loss: 0.3616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5619, loss: 0.5311, batch_reg_loss: 0.1939, reg_loss: 0.1939 ||:   6%|6         | 6/95 [00:04<01:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9632, LAS: 0.9271, UEM: 0.7234, LEM: 0.5403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5025, partial_loss/deprel_loss: 0.3931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6089, loss: 0.5487, batch_reg_loss: 0.1939, reg_loss: 0.1939 ||:   9%|9         | 9/95 [00:06<01:03,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9621, LAS: 0.9274, UEM: 0.6765, LEM: 0.4894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6303, partial_loss/deprel_loss: 0.4333, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6665, loss: 0.5548, batch_reg_loss: 0.1939, reg_loss: 0.1939 ||:  14%|#3        | 13/95 [00:08<00:56,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9601, LAS: 0.9255, UEM: 0.6530, LEM: 0.4608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2864, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5459, loss: 0.5703, batch_reg_loss: 0.1938, reg_loss: 0.1939 ||:  18%|#7        | 17/95 [00:11<00:52,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9610, LAS: 0.9265, UEM: 0.6526, LEM: 0.4545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2210, partial_loss/deprel_loss: 0.3544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5216, loss: 0.5622, batch_reg_loss: 0.1938, reg_loss: 0.1939 ||:  21%|##1       | 20/95 [00:13<00:51,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9602, LAS: 0.9258, UEM: 0.6538, LEM: 0.4479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2309, partial_loss/deprel_loss: 0.3187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4950, loss: 0.5697, batch_reg_loss: 0.1938, reg_loss: 0.1939 ||:  24%|##4       | 23/95 [00:16<00:52,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9603, LAS: 0.9256, UEM: 0.6631, LEM: 0.4543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0864, partial_loss/deprel_loss: 0.2300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3951, loss: 0.5738, batch_reg_loss: 0.1938, reg_loss: 0.1939 ||:  27%|##7       | 26/95 [00:18<00:49,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9601, LAS: 0.9251, UEM: 0.6614, LEM: 0.4472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1643, partial_loss/deprel_loss: 0.3030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4691, loss: 0.5745, batch_reg_loss: 0.1938, reg_loss: 0.1939 ||:  32%|###1      | 30/95 [00:21<00:47,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9614, LAS: 0.9263, UEM: 0.6774, LEM: 0.4565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1403, partial_loss/deprel_loss: 0.2896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4535, loss: 0.5672, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||:  35%|###4      | 33/95 [00:23<00:45,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9606, LAS: 0.9259, UEM: 0.6663, LEM: 0.4474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2420, partial_loss/deprel_loss: 0.2978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4805, loss: 0.5706, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||:  39%|###8      | 37/95 [00:26<00:41,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9610, LAS: 0.9263, UEM: 0.6568, LEM: 0.4333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3393, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5491, loss: 0.5693, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||:  43%|####3     | 41/95 [00:28<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9607, LAS: 0.9261, UEM: 0.6518, LEM: 0.4284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1285, partial_loss/deprel_loss: 0.2848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4473, loss: 0.5723, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||:  46%|####6     | 44/95 [00:31<00:37,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9613, LAS: 0.9269, UEM: 0.6689, LEM: 0.4485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4425, partial_loss/deprel_loss: 0.3508, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5629, loss: 0.5654, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||:  49%|####9     | 47/95 [00:33<00:37,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9617, LAS: 0.9273, UEM: 0.6746, LEM: 0.4532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1656, partial_loss/deprel_loss: 0.2683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4416, loss: 0.5625, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||:  53%|#####2    | 50/95 [00:35<00:34,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9613, LAS: 0.9269, UEM: 0.6674, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6161, partial_loss/deprel_loss: 0.4413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6700, loss: 0.5647, batch_reg_loss: 0.1938, reg_loss: 0.1938 ||:  56%|#####5    | 53/95 [00:38<00:31,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9611, LAS: 0.9265, UEM: 0.6608, LEM: 0.4385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2018, partial_loss/deprel_loss: 0.3626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5242, loss: 0.5683, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||:  59%|#####8    | 56/95 [00:40<00:28,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9602, LAS: 0.9257, UEM: 0.6464, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4386, partial_loss/deprel_loss: 0.3756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5819, loss: 0.5758, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||:  63%|######3   | 60/95 [00:42<00:24,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9752, UAS: 0.9611, LAS: 0.9269, UEM: 0.6718, LEM: 0.4589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0250, partial_loss/deprel_loss: 0.1154, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2911, loss: 0.5690, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||:  66%|######6   | 63/95 [00:44<00:22,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9618, LAS: 0.9275, UEM: 0.6753, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2018, partial_loss/deprel_loss: 0.3104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4824, loss: 0.5649, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||:  71%|#######   | 67/95 [00:47<00:19,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9622, LAS: 0.9279, UEM: 0.6779, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1592, partial_loss/deprel_loss: 0.2677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4397, loss: 0.5626, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||:  74%|#######3  | 70/95 [00:49<00:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9623, LAS: 0.9279, UEM: 0.6740, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4977, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6419, loss: 0.5636, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||:  77%|#######6  | 73/95 [00:51<00:15,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9624, LAS: 0.9278, UEM: 0.6712, LEM: 0.4476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2408, partial_loss/deprel_loss: 0.3397, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5136, loss: 0.5636, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||:  80%|########  | 76/95 [00:54<00:14,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9630, LAS: 0.9283, UEM: 0.6791, LEM: 0.4545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1598, partial_loss/deprel_loss: 0.2910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4584, loss: 0.5600, batch_reg_loss: 0.1937, reg_loss: 0.1938 ||:  84%|########4 | 80/95 [00:57<00:10,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9628, LAS: 0.9281, UEM: 0.6764, LEM: 0.4518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1033, partial_loss/deprel_loss: 0.2547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4181, loss: 0.5623, batch_reg_loss: 0.1936, reg_loss: 0.1938 ||:  88%|########8 | 84/95 [00:59<00:07,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9625, LAS: 0.9277, UEM: 0.6714, LEM: 0.4459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5945, partial_loss/deprel_loss: 0.5072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7183, loss: 0.5645, batch_reg_loss: 0.1936, reg_loss: 0.1938 ||:  93%|#########2| 88/95 [01:02<00:04,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9626, LAS: 0.9278, UEM: 0.6743, LEM: 0.4488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1555, partial_loss/deprel_loss: 0.2837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4517, loss: 0.5638, batch_reg_loss: 0.1936, reg_loss: 0.1938 ||:  97%|#########6| 92/95 [01:04<00:01,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9623, LAS: 0.9275, UEM: 0.6714, LEM: 0.4458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1766, partial_loss/deprel_loss: 0.3487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5079, loss: 0.5658, batch_reg_loss: 0.1936, reg_loss: 0.1938 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-07 01:43:40,329 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9546, LAS: 0.9034, UEM: 0.6531, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5055, partial_loss/deprel_loss: 7.8762, partial_loss/cycle_loss: 0.0000, batch_loss: 6.4020, loss: 6.6940, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:06,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9639, LAS: 0.9178, UEM: 0.7926, LEM: 0.5240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2003, partial_loss/deprel_loss: 5.6713, partial_loss/cycle_loss: 0.0000, batch_loss: 4.5771, loss: 5.6320, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  55%|#####4    | 6/11 [00:05<00:04,  1.10it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9541, LAS: 0.9039, UEM: 0.7210, LEM: 0.4471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6134, partial_loss/deprel_loss: 7.0592, partial_loss/cycle_loss: 0.0000, batch_loss: 5.7700, loss: 7.5659, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  82%|########1 | 9/11 [00:08<00:01,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9517, LAS: 0.9005, UEM: 0.6847, LEM: 0.4120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2930, partial_loss/deprel_loss: 16.4667, partial_loss/cycle_loss: 0.0000, batch_loss: 13.4320, loss: 8.1682, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:09<00:00,  1.13it/s]\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.194  |     0.000\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - UEM                      |     0.671  |     0.685\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - LEM                      |     0.446  |     0.412\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - EM                       |     0.941  |     0.879\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.177  |     1.293\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:43:50,107 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |     0.952\n",
+      "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.349  |    16.467\n",
+      "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - loss                     |     0.566  |     8.168\n",
+      "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |     0.901\n",
+      "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:43:50,108 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:43:50,113 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:44:00,106 - INFO - combo.training.trainer - Epoch duration: 0:01:29.560242\n",
+      "2023-04-07 01:44:00,107 - INFO - combo.training.trainer - Estimated training time remaining: 4:47:35\n",
+      "2023-04-07 01:44:00,107 - INFO - allennlp.training.trainer - Epoch 151/399\n",
+      "2023-04-07 01:44:00,107 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:44:00,108 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:44:00,117 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9609, LAS: 0.9235, UEM: 0.7176, LEM: 0.5126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1536, partial_loss/deprel_loss: 0.2770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4459, loss: 0.5892, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||:   3%|3         | 3/95 [00:02<01:06,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9565, LAS: 0.9205, UEM: 0.6866, LEM: 0.4729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1358, partial_loss/deprel_loss: 0.3196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4764, loss: 0.6192, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||:   6%|6         | 6/95 [00:04<01:04,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9518, LAS: 0.9166, UEM: 0.6304, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6188, partial_loss/deprel_loss: 0.4459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6740, loss: 0.6535, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||:  11%|#         | 10/95 [00:06<00:59,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9565, LAS: 0.9215, UEM: 0.6676, LEM: 0.4406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2009, partial_loss/deprel_loss: 0.2795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4574, loss: 0.6097, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||:  14%|#3        | 13/95 [00:09<01:02,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9595, LAS: 0.9243, UEM: 0.6698, LEM: 0.4267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3932, partial_loss/deprel_loss: 0.3966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5895, loss: 0.5908, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||:  18%|#7        | 17/95 [00:12<00:57,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9597, LAS: 0.9247, UEM: 0.6644, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6641, partial_loss/deprel_loss: 0.4789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7095, loss: 0.5852, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||:  22%|##2       | 21/95 [00:14<00:51,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9596, LAS: 0.9243, UEM: 0.6369, LEM: 0.3989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4559, partial_loss/deprel_loss: 0.4409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6374, loss: 0.5890, batch_reg_loss: 0.1936, reg_loss: 0.1936 ||:  26%|##6       | 25/95 [00:17<00:47,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9590, LAS: 0.9236, UEM: 0.6199, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3745, partial_loss/deprel_loss: 0.3930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5828, loss: 0.5937, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||:  29%|##9       | 28/95 [00:19<00:45,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9586, LAS: 0.9238, UEM: 0.6553, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6416, partial_loss/deprel_loss: 0.4670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6955, loss: 0.5927, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||:  33%|###2      | 31/95 [00:22<00:47,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9587, LAS: 0.9240, UEM: 0.6528, LEM: 0.4421, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3300, partial_loss/deprel_loss: 0.3677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5537, loss: 0.5907, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||:  36%|###5      | 34/95 [00:24<00:44,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9604, LAS: 0.9261, UEM: 0.6791, LEM: 0.4685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0871, partial_loss/deprel_loss: 0.2256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3914, loss: 0.5778, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||:  39%|###8      | 37/95 [00:26<00:43,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9611, LAS: 0.9269, UEM: 0.6815, LEM: 0.4689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2208, partial_loss/deprel_loss: 0.2999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4777, loss: 0.5705, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||:  42%|####2     | 40/95 [00:28<00:41,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9615, LAS: 0.9275, UEM: 0.6845, LEM: 0.4712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2482, partial_loss/deprel_loss: 0.3329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5095, loss: 0.5650, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||:  45%|####5     | 43/95 [00:31<00:39,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9613, LAS: 0.9272, UEM: 0.6755, LEM: 0.4621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4317, partial_loss/deprel_loss: 0.4471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6375, loss: 0.5672, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||:  48%|####8     | 46/95 [00:33<00:36,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9618, LAS: 0.9277, UEM: 0.6789, LEM: 0.4637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1184, partial_loss/deprel_loss: 0.2675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4311, loss: 0.5634, batch_reg_loss: 0.1935, reg_loss: 0.1936 ||:  52%|#####1    | 49/95 [00:35<00:33,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9611, LAS: 0.9270, UEM: 0.6670, LEM: 0.4520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3595, partial_loss/deprel_loss: 0.3445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5410, loss: 0.5680, batch_reg_loss: 0.1935, reg_loss: 0.1935 ||:  56%|#####5    | 53/95 [00:37<00:28,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9618, LAS: 0.9271, UEM: 0.6702, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3766, partial_loss/deprel_loss: 0.4459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6255, loss: 0.5663, batch_reg_loss: 0.1935, reg_loss: 0.1935 ||:  60%|######    | 57/95 [00:40<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9626, LAS: 0.9279, UEM: 0.6817, LEM: 0.4618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1669, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5150, loss: 0.5599, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||:  64%|######4   | 61/95 [00:43<00:23,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9627, LAS: 0.9279, UEM: 0.6785, LEM: 0.4557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4057, partial_loss/deprel_loss: 0.3609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5633, loss: 0.5593, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||:  67%|######7   | 64/95 [00:45<00:21,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9617, LAS: 0.9270, UEM: 0.6698, LEM: 0.4479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4893, partial_loss/deprel_loss: 0.4235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6301, loss: 0.5659, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||:  72%|#######1  | 68/95 [00:47<00:18,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9620, LAS: 0.9274, UEM: 0.6724, LEM: 0.4492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4837, partial_loss/deprel_loss: 0.4864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6793, loss: 0.5645, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||:  75%|#######4  | 71/95 [00:49<00:16,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9569, UAS: 0.9623, LAS: 0.9278, UEM: 0.6786, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0840, partial_loss/deprel_loss: 0.1542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3335, loss: 0.5623, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||:  79%|#######8  | 75/95 [00:52<00:13,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9620, LAS: 0.9274, UEM: 0.6722, LEM: 0.4518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4358, partial_loss/deprel_loss: 0.4788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6636, loss: 0.5649, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||:  82%|########2 | 78/95 [00:54<00:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9621, LAS: 0.9276, UEM: 0.6706, LEM: 0.4497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2036, partial_loss/deprel_loss: 0.3381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5046, loss: 0.5636, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||:  86%|########6 | 82/95 [00:57<00:08,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9627, LAS: 0.9281, UEM: 0.6791, LEM: 0.4576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1542, partial_loss/deprel_loss: 0.3010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4650, loss: 0.5601, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||:  91%|######### | 86/95 [00:59<00:06,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9629, LAS: 0.9283, UEM: 0.6831, LEM: 0.4615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3320, partial_loss/deprel_loss: 0.4114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5889, loss: 0.5585, batch_reg_loss: 0.1934, reg_loss: 0.1935 ||:  94%|#########3| 89/95 [01:02<00:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9621, LAS: 0.9273, UEM: 0.6730, LEM: 0.4528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7520, partial_loss/deprel_loss: 0.5173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7576, loss: 0.5648, batch_reg_loss: 0.1933, reg_loss: 0.1935 ||:  98%|#########7| 93/95 [01:04<00:01,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9617, LAS: 0.9269, UEM: 0.6690, LEM: 0.4492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4188, partial_loss/deprel_loss: 0.4986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6760, loss: 0.5690, batch_reg_loss: 0.1933, reg_loss: 0.1935 ||: 100%|##########| 95/95 [01:05<00:00,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:45:08,431 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.193  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - UEM                      |     0.669  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - LEM                      |     0.449  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - EM                       |     0.919  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.419  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.499  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - loss                     |     0.569  |       N/A\n",
+      "2023-04-07 01:45:08,432 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |       N/A\n",
+      "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:45:08,433 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:45:08,437 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:45:13,292 - INFO - combo.training.trainer - Epoch duration: 0:01:13.185240\n",
+      "2023-04-07 01:45:13,293 - INFO - combo.training.trainer - Estimated training time remaining: 4:46:32\n",
+      "2023-04-07 01:45:13,293 - INFO - allennlp.training.trainer - Epoch 152/399\n",
+      "2023-04-07 01:45:13,293 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:45:13,294 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:45:13,303 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9648, LAS: 0.9306, UEM: 0.6706, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2947, partial_loss/deprel_loss: 0.3594, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5398, loss: 0.5604, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||:   5%|5         | 5/95 [00:02<00:42,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9627, LAS: 0.9267, UEM: 0.6190, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2238, partial_loss/deprel_loss: 0.3424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5120, loss: 0.5719, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||:  11%|#         | 10/95 [00:04<00:40,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9643, LAS: 0.9288, UEM: 0.7303, LEM: 0.5263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3319, partial_loss/deprel_loss: 0.4157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5923, loss: 0.5558, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||:  15%|#4        | 14/95 [00:06<00:39,  2.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9645, LAS: 0.9296, UEM: 0.7163, LEM: 0.5095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3716, partial_loss/deprel_loss: 0.3478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5459, loss: 0.5503, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||:  19%|#8        | 18/95 [00:09<00:39,  1.96it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9622, LAS: 0.9271, UEM: 0.6931, LEM: 0.4872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6067, partial_loss/deprel_loss: 0.5146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7263, loss: 0.5661, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||:  22%|##2       | 21/95 [00:11<00:43,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9607, LAS: 0.9260, UEM: 0.6901, LEM: 0.4842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2320, partial_loss/deprel_loss: 0.2290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4229, loss: 0.5708, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||:  25%|##5       | 24/95 [00:13<00:44,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9553, UAS: 0.9600, LAS: 0.9256, UEM: 0.6950, LEM: 0.4992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0893, partial_loss/deprel_loss: 0.1721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3488, loss: 0.5732, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||:  29%|##9       | 28/95 [00:16<00:42,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9371, UAS: 0.9614, LAS: 0.9271, UEM: 0.7062, LEM: 0.5077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2809, partial_loss/deprel_loss: 0.3315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5147, loss: 0.5640, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||:  33%|###2      | 31/95 [00:18<00:43,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9608, LAS: 0.9264, UEM: 0.6887, LEM: 0.4898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5052, partial_loss/deprel_loss: 0.4907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6869, loss: 0.5703, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||:  36%|###5      | 34/95 [00:20<00:41,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9617, LAS: 0.9273, UEM: 0.6921, LEM: 0.4883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3621, partial_loss/deprel_loss: 0.3911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5786, loss: 0.5651, batch_reg_loss: 0.1933, reg_loss: 0.1933 ||:  39%|###8      | 37/95 [00:22<00:39,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9620, LAS: 0.9275, UEM: 0.6851, LEM: 0.4755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4416, partial_loss/deprel_loss: 0.4813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6666, loss: 0.5657, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||:  43%|####3     | 41/95 [00:24<00:34,  1.54it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9630, LAS: 0.9288, UEM: 0.6947, LEM: 0.4836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1287, partial_loss/deprel_loss: 0.2286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4019, loss: 0.5575, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||:  47%|####7     | 45/95 [00:27<00:33,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9638, LAS: 0.9297, UEM: 0.7002, LEM: 0.4856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1377, partial_loss/deprel_loss: 0.2813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4458, loss: 0.5526, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||:  51%|#####     | 48/95 [00:30<00:33,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9637, LAS: 0.9294, UEM: 0.6944, LEM: 0.4783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4207, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6260, loss: 0.5551, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||:  54%|#####3    | 51/95 [00:32<00:30,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9633, LAS: 0.9287, UEM: 0.6831, LEM: 0.4660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4890, partial_loss/deprel_loss: 0.4775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6730, loss: 0.5592, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||:  58%|#####7    | 55/95 [00:34<00:26,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9632, LAS: 0.9287, UEM: 0.6790, LEM: 0.4609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3341, partial_loss/deprel_loss: 0.4006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5805, loss: 0.5607, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||:  62%|######2   | 59/95 [00:37<00:23,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9622, LAS: 0.9275, UEM: 0.6744, LEM: 0.4566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1663, partial_loss/deprel_loss: 0.2727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4446, loss: 0.5681, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||:  66%|######6   | 63/95 [00:40<00:21,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9627, LAS: 0.9281, UEM: 0.6756, LEM: 0.4548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2209, partial_loss/deprel_loss: 0.3555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5217, loss: 0.5650, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||:  71%|#######   | 67/95 [00:42<00:18,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9613, UAS: 0.9632, LAS: 0.9286, UEM: 0.6861, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0724, partial_loss/deprel_loss: 0.1966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3649, loss: 0.5610, batch_reg_loss: 0.1932, reg_loss: 0.1933 ||:  75%|#######4  | 71/95 [00:45<00:16,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9633, LAS: 0.9287, UEM: 0.6829, LEM: 0.4647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0953, partial_loss/deprel_loss: 0.2526, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4142, loss: 0.5609, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||:  79%|#######8  | 75/95 [00:48<00:13,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9632, LAS: 0.9287, UEM: 0.6810, LEM: 0.4615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3365, partial_loss/deprel_loss: 0.3297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5242, loss: 0.5611, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||:  82%|########2 | 78/95 [00:50<00:12,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9316, UAS: 0.9635, LAS: 0.9291, UEM: 0.6777, LEM: 0.4563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2915, partial_loss/deprel_loss: 0.3460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5282, loss: 0.5593, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||:  86%|########6 | 82/95 [00:53<00:09,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9630, LAS: 0.9285, UEM: 0.6734, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2280, partial_loss/deprel_loss: 0.3802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5428, loss: 0.5626, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||:  89%|########9 | 85/95 [00:55<00:06,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9631, LAS: 0.9287, UEM: 0.6759, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1918, partial_loss/deprel_loss: 0.2593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4389, loss: 0.5614, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||:  93%|#########2| 88/95 [00:57<00:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9633, LAS: 0.9287, UEM: 0.6769, LEM: 0.4534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1660, partial_loss/deprel_loss: 0.3621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.5614, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||:  97%|#########6| 92/95 [00:59<00:02,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9630, LAS: 0.9284, UEM: 0.6751, LEM: 0.4527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5550, partial_loss/deprel_loss: 0.5504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7444, loss: 0.5642, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||: 100%|##########| 95/95 [01:01<00:00,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9630, LAS: 0.9284, UEM: 0.6751, LEM: 0.4527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5550, partial_loss/deprel_loss: 0.5504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7444, loss: 0.5642, batch_reg_loss: 0.1931, reg_loss: 0.1932 ||: 100%|##########| 95/95 [01:01<00:00,  1.53it/s]\n",
+      "2023-04-07 01:46:18,477 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:46:18,477 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:46:18,477 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.193  |       N/A\n",
+      "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - UEM                      |     0.675  |       N/A\n",
+      "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - LEM                      |     0.453  |       N/A\n",
+      "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - EM                       |     0.907  |       N/A\n",
+      "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.555  |       N/A\n",
+      "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
+      "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:46:18,478 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.550  |       N/A\n",
+      "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - loss                     |     0.564  |       N/A\n",
+      "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - LAS                      |     0.928  |       N/A\n",
+      "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:46:18,479 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:46:18,484 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:46:23,248 - INFO - combo.training.trainer - Epoch duration: 0:01:09.955236\n",
+      "2023-04-07 01:46:23,249 - INFO - combo.training.trainer - Estimated training time remaining: 4:45:23\n",
+      "2023-04-07 01:46:23,249 - INFO - allennlp.training.trainer - Epoch 153/399\n",
+      "2023-04-07 01:46:23,249 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:46:23,249 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:46:23,258 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9771, LAS: 0.9493, UEM: 0.8953, LEM: 0.7781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4817, partial_loss/deprel_loss: 0.4267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6308, loss: 0.4343, batch_reg_loss: 0.1931, reg_loss: 0.1931 ||:   3%|3         | 3/95 [00:02<01:22,  1.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9461, UAS: 0.9711, LAS: 0.9399, UEM: 0.8135, LEM: 0.6574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2107, partial_loss/deprel_loss: 0.2550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4392, loss: 0.4993, batch_reg_loss: 0.1931, reg_loss: 0.1931 ||:   6%|6         | 6/95 [00:04<01:15,  1.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9663, LAS: 0.9337, UEM: 0.7370, LEM: 0.5718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2946, partial_loss/deprel_loss: 0.3613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5410, loss: 0.5429, batch_reg_loss: 0.1931, reg_loss: 0.1931 ||:   9%|9         | 9/95 [00:07<01:10,  1.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9506, UAS: 0.9677, LAS: 0.9344, UEM: 0.7167, LEM: 0.5239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2023, partial_loss/deprel_loss: 0.2878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4638, loss: 0.5343, batch_reg_loss: 0.1931, reg_loss: 0.1931 ||:  14%|#3        | 13/95 [00:09<01:02,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9276, UAS: 0.9664, LAS: 0.9334, UEM: 0.6901, LEM: 0.4919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4230, partial_loss/deprel_loss: 0.4130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6081, loss: 0.5385, batch_reg_loss: 0.1930, reg_loss: 0.1931 ||:  17%|#6        | 16/95 [00:11<00:58,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9504, UAS: 0.9642, LAS: 0.9310, UEM: 0.6634, LEM: 0.4599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1400, partial_loss/deprel_loss: 0.2451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4171, loss: 0.5492, batch_reg_loss: 0.1930, reg_loss: 0.1931 ||:  22%|##2       | 21/95 [00:13<00:48,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9628, LAS: 0.9295, UEM: 0.6412, LEM: 0.4324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5040, partial_loss/deprel_loss: 0.4501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6539, loss: 0.5579, batch_reg_loss: 0.1930, reg_loss: 0.1931 ||:  27%|##7       | 26/95 [00:16<00:40,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9631, LAS: 0.9300, UEM: 0.6525, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3238, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.5518, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||:  33%|###2      | 31/95 [00:18<00:34,  1.87it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9615, LAS: 0.9284, UEM: 0.6319, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4570, partial_loss/deprel_loss: 0.4195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6200, loss: 0.5611, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||:  37%|###6      | 35/95 [00:20<00:33,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9614, LAS: 0.9283, UEM: 0.6278, LEM: 0.4211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1774, partial_loss/deprel_loss: 0.3100, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4765, loss: 0.5609, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||:  41%|####1     | 39/95 [00:23<00:32,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9606, LAS: 0.9271, UEM: 0.6268, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5077, partial_loss/deprel_loss: 0.4792, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6779, loss: 0.5675, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||:  45%|####5     | 43/95 [00:26<00:33,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9603, LAS: 0.9268, UEM: 0.6262, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1813, partial_loss/deprel_loss: 0.2470, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.5698, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||:  49%|####9     | 47/95 [00:29<00:32,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9617, LAS: 0.9280, UEM: 0.6514, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1773, partial_loss/deprel_loss: 0.3006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4689, loss: 0.5614, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||:  54%|#####3    | 51/95 [00:32<00:31,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9622, LAS: 0.9285, UEM: 0.6540, LEM: 0.4367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1640, partial_loss/deprel_loss: 0.2882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4564, loss: 0.5598, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||:  58%|#####7    | 55/95 [00:35<00:28,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9536, UAS: 0.9628, LAS: 0.9291, UEM: 0.6585, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1173, partial_loss/deprel_loss: 0.2618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4259, loss: 0.5565, batch_reg_loss: 0.1930, reg_loss: 0.1930 ||:  61%|######1   | 58/95 [00:37<00:26,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9635, LAS: 0.9298, UEM: 0.6767, LEM: 0.4580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0988, partial_loss/deprel_loss: 0.2582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.5503, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||:  64%|######4   | 61/95 [00:39<00:25,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9638, LAS: 0.9301, UEM: 0.6752, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2344, partial_loss/deprel_loss: 0.3192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4952, loss: 0.5482, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||:  67%|######7   | 64/95 [00:42<00:22,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9635, LAS: 0.9300, UEM: 0.6734, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6799, partial_loss/deprel_loss: 0.5022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7306, loss: 0.5498, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||:  71%|#######   | 67/95 [00:44<00:20,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9638, LAS: 0.9303, UEM: 0.6732, LEM: 0.4529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3393, partial_loss/deprel_loss: 0.4257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6013, loss: 0.5486, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||:  74%|#######3  | 70/95 [00:46<00:18,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9635, LAS: 0.9300, UEM: 0.6789, LEM: 0.4620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0780, partial_loss/deprel_loss: 0.1876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3586, loss: 0.5509, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||:  77%|#######6  | 73/95 [00:48<00:16,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9635, LAS: 0.9299, UEM: 0.6765, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1778, partial_loss/deprel_loss: 0.3246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.5520, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||:  81%|########1 | 77/95 [00:51<00:12,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9631, LAS: 0.9294, UEM: 0.6768, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1478, partial_loss/deprel_loss: 0.2834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4492, loss: 0.5553, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||:  84%|########4 | 80/95 [00:53<00:10,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9628, LAS: 0.9291, UEM: 0.6762, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1173, partial_loss/deprel_loss: 0.2424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4103, loss: 0.5563, batch_reg_loss: 0.1929, reg_loss: 0.1930 ||:  87%|########7 | 83/95 [00:55<00:08,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9632, LAS: 0.9295, UEM: 0.6797, LEM: 0.4598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3616, partial_loss/deprel_loss: 0.4243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6046, loss: 0.5544, batch_reg_loss: 0.1928, reg_loss: 0.1930 ||:  92%|#########1| 87/95 [00:58<00:05,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9625, LAS: 0.9287, UEM: 0.6712, LEM: 0.4517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9480, partial_loss/deprel_loss: 0.5740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8416, loss: 0.5597, batch_reg_loss: 0.1928, reg_loss: 0.1930 ||:  96%|#########5| 91/95 [01:00<00:02,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9624, LAS: 0.9286, UEM: 0.6717, LEM: 0.4545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5954, partial_loss/deprel_loss: 0.4826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6980, loss: 0.5606, batch_reg_loss: 0.1928, reg_loss: 0.1930 ||: 100%|##########| 95/95 [01:03<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9624, LAS: 0.9286, UEM: 0.6717, LEM: 0.4545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5954, partial_loss/deprel_loss: 0.4826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6980, loss: 0.5606, batch_reg_loss: 0.1928, reg_loss: 0.1930 ||: 100%|##########| 95/95 [01:03<00:00,  1.49it/s]\n",
+      "2023-04-07 01:47:29,975 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:47:29,975 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:47:29,975 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.193  |       N/A\n",
+      "2023-04-07 01:47:29,975 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:47:29,975 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - UEM                      |     0.672  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - LEM                      |     0.454  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - EM                       |     0.911  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.595  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.483  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - loss                     |     0.561  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:47:29,976 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:47:29,983 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:47:34,665 - INFO - combo.training.trainer - Epoch duration: 0:01:11.416434\n",
+      "2023-04-07 01:47:34,666 - INFO - combo.training.trainer - Estimated training time remaining: 4:44:17\n",
+      "2023-04-07 01:47:34,666 - INFO - allennlp.training.trainer - Epoch 154/399\n",
+      "2023-04-07 01:47:34,666 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:47:34,666 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:47:34,675 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9608, LAS: 0.9279, UEM: 0.7436, LEM: 0.5331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1496, partial_loss/deprel_loss: 0.2507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4233, loss: 0.5443, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||:   3%|3         | 3/95 [00:02<01:10,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9662, LAS: 0.9326, UEM: 0.7900, LEM: 0.6003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4828, loss: 0.5179, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||:   6%|6         | 6/95 [00:04<01:05,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9690, LAS: 0.9349, UEM: 0.7779, LEM: 0.5632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2334, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5269, loss: 0.5133, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||:  11%|#         | 10/95 [00:06<00:59,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9673, LAS: 0.9324, UEM: 0.7386, LEM: 0.5174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2396, partial_loss/deprel_loss: 0.3731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5392, loss: 0.5312, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||:  14%|#3        | 13/95 [00:08<00:57,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9652, LAS: 0.9304, UEM: 0.6980, LEM: 0.4796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4147, partial_loss/deprel_loss: 0.4058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6004, loss: 0.5489, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||:  18%|#7        | 17/95 [00:11<00:53,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9644, LAS: 0.9295, UEM: 0.6804, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6424, partial_loss/deprel_loss: 0.4568, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6867, loss: 0.5554, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||:  22%|##2       | 21/95 [00:13<00:49,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9657, LAS: 0.9310, UEM: 0.7083, LEM: 0.4953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1441, partial_loss/deprel_loss: 0.2520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4232, loss: 0.5453, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||:  25%|##5       | 24/95 [00:16<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9670, LAS: 0.9332, UEM: 0.7441, LEM: 0.5471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3460, partial_loss/deprel_loss: 0.3733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5606, loss: 0.5323, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||:  28%|##8       | 27/95 [00:18<00:50,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9672, LAS: 0.9335, UEM: 0.7319, LEM: 0.5283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3969, partial_loss/deprel_loss: 0.3813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5772, loss: 0.5337, batch_reg_loss: 0.1928, reg_loss: 0.1928 ||:  33%|###2      | 31/95 [00:21<00:45,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9652, LAS: 0.9320, UEM: 0.7065, LEM: 0.5027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4192, partial_loss/deprel_loss: 0.3733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5752, loss: 0.5440, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||:  38%|###7      | 36/95 [00:23<00:37,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9648, LAS: 0.9312, UEM: 0.6991, LEM: 0.4924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6344, partial_loss/deprel_loss: 0.5251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7397, loss: 0.5485, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||:  43%|####3     | 41/95 [00:26<00:31,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9652, LAS: 0.9317, UEM: 0.6909, LEM: 0.4790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3004, partial_loss/deprel_loss: 0.3089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4999, loss: 0.5428, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||:  48%|####8     | 46/95 [00:28<00:26,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9654, LAS: 0.9319, UEM: 0.6949, LEM: 0.4822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1893, partial_loss/deprel_loss: 0.3457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5071, loss: 0.5413, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||:  54%|#####3    | 51/95 [00:30<00:23,  1.90it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8626, UAS: 0.9645, LAS: 0.9307, UEM: 0.6942, LEM: 0.4826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0792, partial_loss/deprel_loss: 0.6491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9278, loss: 0.5480, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||:  58%|#####7    | 55/95 [00:33<00:22,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9643, LAS: 0.9303, UEM: 0.6942, LEM: 0.4802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1887, partial_loss/deprel_loss: 0.3228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.5500, batch_reg_loss: 0.1927, reg_loss: 0.1928 ||:  62%|######2   | 59/95 [00:36<00:22,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9348, UAS: 0.9645, LAS: 0.9304, UEM: 0.6892, LEM: 0.4732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2624, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5398, loss: 0.5500, batch_reg_loss: 0.1927, reg_loss: 0.1927 ||:  66%|######6   | 63/95 [00:38<00:19,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9643, LAS: 0.9301, UEM: 0.6898, LEM: 0.4738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1419, partial_loss/deprel_loss: 0.2940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4562, loss: 0.5522, batch_reg_loss: 0.1927, reg_loss: 0.1927 ||:  71%|#######   | 67/95 [00:41<00:18,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9643, LAS: 0.9300, UEM: 0.6867, LEM: 0.4705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1890, partial_loss/deprel_loss: 0.2696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4461, loss: 0.5519, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||:  75%|#######4  | 71/95 [00:44<00:16,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9632, LAS: 0.9289, UEM: 0.6760, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5151, partial_loss/deprel_loss: 0.4756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6761, loss: 0.5604, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||:  79%|#######8  | 75/95 [00:47<00:13,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9629, LAS: 0.9287, UEM: 0.6774, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7689, partial_loss/deprel_loss: 0.5712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8034, loss: 0.5623, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||:  82%|########2 | 78/95 [00:49<00:11,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9626, LAS: 0.9284, UEM: 0.6756, LEM: 0.4626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.3204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.5640, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||:  85%|########5 | 81/95 [00:51<00:10,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9622, LAS: 0.9280, UEM: 0.6737, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1969, partial_loss/deprel_loss: 0.3246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4916, loss: 0.5692, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||:  88%|########8 | 84/95 [00:53<00:07,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9624, LAS: 0.9282, UEM: 0.6741, LEM: 0.4587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6484, partial_loss/deprel_loss: 0.4866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7116, loss: 0.5675, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||:  93%|#########2| 88/95 [00:56<00:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9625, LAS: 0.9283, UEM: 0.6744, LEM: 0.4581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3919, partial_loss/deprel_loss: 0.4826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6571, loss: 0.5661, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||:  96%|#########5| 91/95 [00:58<00:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9627, LAS: 0.9284, UEM: 0.6749, LEM: 0.4557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1751, partial_loss/deprel_loss: 0.3422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5014, loss: 0.5655, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||:  99%|#########8| 94/95 [01:00<00:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9626, LAS: 0.9282, UEM: 0.6726, LEM: 0.4536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5320, partial_loss/deprel_loss: 0.4197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6347, loss: 0.5662, batch_reg_loss: 0.1926, reg_loss: 0.1927 ||: 100%|##########| 95/95 [01:01<00:00,  1.54it/s]\n",
+      "2023-04-07 01:48:39,035 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.193  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - UEM                      |     0.673  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - LEM                      |     0.454  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - EM                       |     0.909  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.532  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.420  |       N/A\n",
+      "2023-04-07 01:48:39,036 - INFO - combo.training.tensorboard_writer - loss                     |     0.566  |       N/A\n",
+      "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - LAS                      |     0.928  |       N/A\n",
+      "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:48:39,037 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:48:39,042 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:48:43,859 - INFO - combo.training.trainer - Epoch duration: 0:01:09.193646\n",
+      "2023-04-07 01:48:43,860 - INFO - combo.training.trainer - Estimated training time remaining: 4:43:08\n",
+      "2023-04-07 01:48:43,860 - INFO - allennlp.training.trainer - Epoch 155/399\n",
+      "2023-04-07 01:48:43,860 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:48:43,861 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:48:43,870 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9608, LAS: 0.9276, UEM: 0.6483, LEM: 0.4555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5723, partial_loss/deprel_loss: 0.4925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7011, loss: 0.5914, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||:   3%|3         | 3/95 [00:02<01:08,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9570, LAS: 0.9259, UEM: 0.5925, LEM: 0.3870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5579, partial_loss/deprel_loss: 0.4107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6328, loss: 0.6037, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||:   6%|6         | 6/95 [00:04<01:05,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9636, LAS: 0.9320, UEM: 0.6805, LEM: 0.4508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1039, partial_loss/deprel_loss: 0.2436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4082, loss: 0.5590, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||:   9%|9         | 9/95 [00:06<01:04,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9625, LAS: 0.9313, UEM: 0.6726, LEM: 0.4485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2871, partial_loss/deprel_loss: 0.3332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5166, loss: 0.5573, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||:  13%|#2        | 12/95 [00:08<01:02,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9631, LAS: 0.9307, UEM: 0.6691, LEM: 0.4400, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6312, partial_loss/deprel_loss: 0.4830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7052, loss: 0.5559, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||:  17%|#6        | 16/95 [00:11<00:57,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9641, LAS: 0.9316, UEM: 0.6668, LEM: 0.4319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2240, partial_loss/deprel_loss: 0.3047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4812, loss: 0.5485, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||:  21%|##1       | 20/95 [00:14<00:53,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9516, UAS: 0.9643, LAS: 0.9317, UEM: 0.6792, LEM: 0.4498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0868, partial_loss/deprel_loss: 0.2085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3767, loss: 0.5462, batch_reg_loss: 0.1926, reg_loss: 0.1926 ||:  24%|##4       | 23/95 [00:16<00:52,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9637, LAS: 0.9306, UEM: 0.6644, LEM: 0.4343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4079, partial_loss/deprel_loss: 0.4262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6151, loss: 0.5520, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||:  27%|##7       | 26/95 [00:18<00:49,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9629, LAS: 0.9300, UEM: 0.6600, LEM: 0.4311, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1871, partial_loss/deprel_loss: 0.2694, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4455, loss: 0.5526, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||:  31%|###       | 29/95 [00:21<00:48,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9623, LAS: 0.9295, UEM: 0.6463, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3637, partial_loss/deprel_loss: 0.3682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.5559, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||:  34%|###3      | 32/95 [00:23<00:45,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9624, LAS: 0.9296, UEM: 0.6430, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5302, partial_loss/deprel_loss: 0.4414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6517, loss: 0.5559, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||:  37%|###6      | 35/95 [00:25<00:43,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9633, LAS: 0.9307, UEM: 0.6570, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2356, partial_loss/deprel_loss: 0.2285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4224, loss: 0.5459, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||:  40%|####      | 38/95 [00:27<00:41,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9634, LAS: 0.9309, UEM: 0.6660, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6523, partial_loss/deprel_loss: 0.4400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6750, loss: 0.5447, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||:  43%|####3     | 41/95 [00:29<00:40,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9628, LAS: 0.9300, UEM: 0.6541, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4980, partial_loss/deprel_loss: 0.4890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6833, loss: 0.5498, batch_reg_loss: 0.1925, reg_loss: 0.1926 ||:  47%|####7     | 45/95 [00:32<00:35,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9621, LAS: 0.9292, UEM: 0.6542, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1845, partial_loss/deprel_loss: 0.2696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4450, loss: 0.5548, batch_reg_loss: 0.1925, reg_loss: 0.1925 ||:  51%|#####     | 48/95 [00:34<00:33,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9628, LAS: 0.9295, UEM: 0.6600, LEM: 0.4277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2775, partial_loss/deprel_loss: 0.4158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5806, loss: 0.5522, batch_reg_loss: 0.1925, reg_loss: 0.1925 ||:  54%|#####3    | 51/95 [00:36<00:31,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9618, LAS: 0.9283, UEM: 0.6547, LEM: 0.4228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4740, partial_loss/deprel_loss: 0.4610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6561, loss: 0.5598, batch_reg_loss: 0.1925, reg_loss: 0.1925 ||:  58%|#####7    | 55/95 [00:38<00:26,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9617, LAS: 0.9282, UEM: 0.6626, LEM: 0.4351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8209, partial_loss/deprel_loss: 0.5248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7765, loss: 0.5588, batch_reg_loss: 0.1925, reg_loss: 0.1925 ||:  62%|######2   | 59/95 [00:41<00:22,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9619, LAS: 0.9282, UEM: 0.6584, LEM: 0.4296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1698, partial_loss/deprel_loss: 0.2726, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4445, loss: 0.5606, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||:  66%|######6   | 63/95 [00:43<00:19,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9624, LAS: 0.9287, UEM: 0.6644, LEM: 0.4367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2067, partial_loss/deprel_loss: 0.2426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4279, loss: 0.5565, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||:  71%|#######   | 67/95 [00:45<00:16,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9623, LAS: 0.9285, UEM: 0.6710, LEM: 0.4432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1447, partial_loss/deprel_loss: 0.2664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4345, loss: 0.5571, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||:  75%|#######4  | 71/95 [00:48<00:15,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9626, LAS: 0.9289, UEM: 0.6697, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2112, partial_loss/deprel_loss: 0.2956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4712, loss: 0.5544, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||:  79%|#######8  | 75/95 [00:51<00:13,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9631, LAS: 0.9293, UEM: 0.6757, LEM: 0.4458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1953, partial_loss/deprel_loss: 0.3077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4776, loss: 0.5512, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||:  83%|########3 | 79/95 [00:53<00:09,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9625, LAS: 0.9286, UEM: 0.6716, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2198, partial_loss/deprel_loss: 0.2848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4642, loss: 0.5562, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||:  87%|########7 | 83/95 [00:55<00:07,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9624, LAS: 0.9285, UEM: 0.6668, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.3556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5308, loss: 0.5571, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||:  93%|#########2| 88/95 [00:57<00:03,  1.82it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9621, LAS: 0.9281, UEM: 0.6598, LEM: 0.4296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5084, partial_loss/deprel_loss: 0.4923, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.5596, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||:  97%|#########6| 92/95 [01:00<00:01,  1.77it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9622, LAS: 0.9282, UEM: 0.6700, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6357, partial_loss/deprel_loss: 0.5351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7476, loss: 0.5587, batch_reg_loss: 0.1924, reg_loss: 0.1925 ||: 100%|##########| 95/95 [01:02<00:00,  1.51it/s]\n",
+      "2023-04-07 01:49:49,763 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9701, LAS: 0.9299, UEM: 0.8368, LEM: 0.6131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3931, partial_loss/deprel_loss: 6.0986, partial_loss/cycle_loss: 0.0000, batch_loss: 4.9575, loss: 4.9463, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:07,  1.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8502, UAS: 0.9506, LAS: 0.9037, UEM: 0.7416, LEM: 0.5267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6095, partial_loss/deprel_loss: 18.9605, partial_loss/cycle_loss: 0.0000, batch_loss: 15.4903, loss: 8.5861, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  45%|####5     | 5/11 [00:04<00:05,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9530, LAS: 0.9025, UEM: 0.7042, LEM: 0.4349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4562, partial_loss/deprel_loss: 7.5291, partial_loss/cycle_loss: 0.0000, batch_loss: 6.1145, loss: 7.8166, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:07<00:02,  1.08it/s]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9512, LAS: 0.9002, UEM: 0.6878, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2184, partial_loss/deprel_loss: 5.5646, partial_loss/cycle_loss: 0.0000, batch_loss: 4.4954, loss: 7.7988, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9512, LAS: 0.9002, UEM: 0.6878, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2184, partial_loss/deprel_loss: 5.5646, partial_loss/cycle_loss: 0.0000, batch_loss: 4.4954, loss: 7.7988, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.04it/s]\n",
+      "2023-04-07 01:50:00,314 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:50:00,314 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:50:00,314 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.192  |     0.000\n",
+      "2023-04-07 01:50:00,314 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:50:00,314 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:50:00,314 - INFO - combo.training.tensorboard_writer - UEM                      |     0.670  |     0.688\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - LEM                      |     0.446  |     0.421\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - EM                       |     0.902  |     0.935\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.636  |     0.218\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |     0.951\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.535  |     5.565\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - loss                     |     0.559  |     7.799\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - LAS                      |     0.928  |     0.900\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:50:00,315 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:50:00,320 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:50:04,527 - INFO - combo.training.trainer - Epoch duration: 0:01:20.667316\n",
+      "2023-04-07 01:50:04,528 - INFO - combo.training.trainer - Estimated training time remaining: 4:42:16\n",
+      "2023-04-07 01:50:04,528 - INFO - allennlp.training.trainer - Epoch 156/399\n",
+      "2023-04-07 01:50:04,528 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:50:04,529 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:50:04,538 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9720, LAS: 0.9388, UEM: 0.7689, LEM: 0.5378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1274, partial_loss/deprel_loss: 0.2506, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4183, loss: 0.4725, batch_reg_loss: 0.1924, reg_loss: 0.1924 ||:   3%|3         | 3/95 [00:02<01:18,  1.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9635, LAS: 0.9312, UEM: 0.6470, LEM: 0.4319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.2940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4703, loss: 0.5486, batch_reg_loss: 0.1923, reg_loss: 0.1924 ||:   7%|7         | 7/95 [00:04<01:07,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9643, LAS: 0.9318, UEM: 0.6621, LEM: 0.4444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3464, partial_loss/deprel_loss: 0.3820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5672, loss: 0.5366, batch_reg_loss: 0.1923, reg_loss: 0.1924 ||:  11%|#         | 10/95 [00:06<01:02,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9637, LAS: 0.9310, UEM: 0.6443, LEM: 0.4260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2167, partial_loss/deprel_loss: 0.3162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.5449, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||:  14%|#3        | 13/95 [00:09<01:00,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9632, LAS: 0.9304, UEM: 0.6377, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3898, partial_loss/deprel_loss: 0.3899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5822, loss: 0.5523, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||:  17%|#6        | 16/95 [00:11<00:59,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9620, LAS: 0.9297, UEM: 0.6260, LEM: 0.4080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2540, partial_loss/deprel_loss: 0.2591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4504, loss: 0.5535, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||:  20%|##        | 19/95 [00:13<00:55,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9637, LAS: 0.9310, UEM: 0.6589, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1565, partial_loss/deprel_loss: 0.3142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4749, loss: 0.5424, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||:  23%|##3       | 22/95 [00:15<00:53,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8739, UAS: 0.9598, LAS: 0.9271, UEM: 0.6327, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9984, partial_loss/deprel_loss: 0.6266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8933, loss: 0.5673, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||:  26%|##6       | 25/95 [00:17<00:51,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9478, UAS: 0.9616, LAS: 0.9289, UEM: 0.6562, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1413, partial_loss/deprel_loss: 0.2387, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4116, loss: 0.5540, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||:  31%|###       | 29/95 [00:20<00:46,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9615, LAS: 0.9287, UEM: 0.6530, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3790, partial_loss/deprel_loss: 0.3616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5573, loss: 0.5562, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||:  34%|###3      | 32/95 [00:22<00:45,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9615, LAS: 0.9284, UEM: 0.6475, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5956, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7070, loss: 0.5583, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||:  38%|###7      | 36/95 [00:25<00:40,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9623, LAS: 0.9290, UEM: 0.6547, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1599, partial_loss/deprel_loss: 0.3209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4810, loss: 0.5537, batch_reg_loss: 0.1923, reg_loss: 0.1923 ||:  42%|####2     | 40/95 [00:27<00:37,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9627, LAS: 0.9291, UEM: 0.6520, LEM: 0.4224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3807, partial_loss/deprel_loss: 0.4060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5932, loss: 0.5514, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||:  46%|####6     | 44/95 [00:30<00:34,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9626, LAS: 0.9287, UEM: 0.6578, LEM: 0.4270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1378, partial_loss/deprel_loss: 0.2436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4146, loss: 0.5531, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||:  49%|####9     | 47/95 [00:32<00:33,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9626, LAS: 0.9287, UEM: 0.6575, LEM: 0.4248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1696, partial_loss/deprel_loss: 0.3004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4665, loss: 0.5530, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||:  53%|#####2    | 50/95 [00:34<00:32,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9565, UAS: 0.9630, LAS: 0.9291, UEM: 0.6669, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0686, partial_loss/deprel_loss: 0.1883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3566, loss: 0.5501, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||:  56%|#####5    | 53/95 [00:37<00:29,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9635, LAS: 0.9296, UEM: 0.6707, LEM: 0.4385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2763, partial_loss/deprel_loss: 0.3287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5104, loss: 0.5468, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||:  59%|#####8    | 56/95 [00:39<00:27,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9641, LAS: 0.9303, UEM: 0.6868, LEM: 0.4605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2544, partial_loss/deprel_loss: 0.3112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4921, loss: 0.5414, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||:  62%|######2   | 59/95 [00:41<00:26,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9644, LAS: 0.9305, UEM: 0.6866, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1881, partial_loss/deprel_loss: 0.2736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4487, loss: 0.5393, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||:  65%|######5   | 62/95 [00:43<00:23,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9648, LAS: 0.9310, UEM: 0.6928, LEM: 0.4653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2850, partial_loss/deprel_loss: 0.3949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5651, loss: 0.5360, batch_reg_loss: 0.1922, reg_loss: 0.1923 ||:  68%|######8   | 65/95 [00:46<00:22,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8921, UAS: 0.9635, LAS: 0.9296, UEM: 0.6842, LEM: 0.4569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8027, partial_loss/deprel_loss: 0.5600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8007, loss: 0.5462, batch_reg_loss: 0.1921, reg_loss: 0.1923 ||:  73%|#######2  | 69/95 [00:48<00:18,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9636, LAS: 0.9297, UEM: 0.6881, LEM: 0.4622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2738, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5281, loss: 0.5464, batch_reg_loss: 0.1921, reg_loss: 0.1923 ||:  77%|#######6  | 73/95 [00:50<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9764, UAS: 0.9636, LAS: 0.9300, UEM: 0.6977, LEM: 0.4795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0214, partial_loss/deprel_loss: 0.0955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2728, loss: 0.5453, batch_reg_loss: 0.1921, reg_loss: 0.1923 ||:  81%|########1 | 77/95 [00:52<00:11,  1.60it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9624, LAS: 0.9288, UEM: 0.6878, LEM: 0.4712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3479, partial_loss/deprel_loss: 0.4048, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5855, loss: 0.5535, batch_reg_loss: 0.1921, reg_loss: 0.1922 ||:  85%|########5 | 81/95 [00:55<00:08,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9623, LAS: 0.9287, UEM: 0.6844, LEM: 0.4670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3306, partial_loss/deprel_loss: 0.4380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6087, loss: 0.5546, batch_reg_loss: 0.1921, reg_loss: 0.1922 ||:  91%|######### | 86/95 [00:57<00:04,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9617, LAS: 0.9279, UEM: 0.6748, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4644, partial_loss/deprel_loss: 0.4204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6213, loss: 0.5612, batch_reg_loss: 0.1921, reg_loss: 0.1922 ||:  96%|#########5| 91/95 [00:59<00:02,  1.88it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9616, LAS: 0.9277, UEM: 0.6721, LEM: 0.4518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2221, partial_loss/deprel_loss: 0.3361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5054, loss: 0.5621, batch_reg_loss: 0.1921, reg_loss: 0.1922 ||: 100%|##########| 95/95 [01:02<00:00,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9616, LAS: 0.9277, UEM: 0.6721, LEM: 0.4518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2221, partial_loss/deprel_loss: 0.3361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5054, loss: 0.5621, batch_reg_loss: 0.1921, reg_loss: 0.1922 ||: 100%|##########| 95/95 [01:02<00:00,  1.51it/s]\n",
+      "2023-04-07 01:51:10,708 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:51:10,708 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 01:51:10,708 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.192  |       N/A\n",
+      "2023-04-07 01:51:10,708 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:51:10,708 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - UEM                      |     0.672  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - LEM                      |     0.452  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - EM                       |     0.935  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.222  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.336  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - loss                     |     0.562  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - LAS                      |     0.928  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:51:10,709 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:51:10,733 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:51:15,513 - INFO - combo.training.trainer - Epoch duration: 0:01:10.985362\n",
+      "2023-04-07 01:51:15,514 - INFO - combo.training.trainer - Estimated training time remaining: 4:41:09\n",
+      "2023-04-07 01:51:15,514 - INFO - allennlp.training.trainer - Epoch 157/399\n",
+      "2023-04-07 01:51:15,514 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:51:15,515 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:51:15,526 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9344, UAS: 0.9738, LAS: 0.9382, UEM: 0.7844, LEM: 0.5275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2396, partial_loss/deprel_loss: 0.3805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5444, loss: 0.5026, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||:   4%|4         | 4/95 [00:02<00:58,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9582, LAS: 0.9227, UEM: 0.6872, LEM: 0.4457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2120, partial_loss/deprel_loss: 0.6602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9627, loss: 0.5984, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||:   8%|8         | 8/95 [00:05<00:56,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9627, LAS: 0.9272, UEM: 0.7279, LEM: 0.4885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3766, partial_loss/deprel_loss: 0.3992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5868, loss: 0.5602, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||:  13%|#2        | 12/95 [00:07<00:54,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9634, LAS: 0.9286, UEM: 0.7222, LEM: 0.4908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1806, partial_loss/deprel_loss: 0.2052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3923, loss: 0.5488, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||:  16%|#5        | 15/95 [00:10<00:53,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9613, LAS: 0.9273, UEM: 0.6857, LEM: 0.4577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.3671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5572, loss: 0.5681, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||:  20%|##        | 19/95 [00:12<00:50,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9617, LAS: 0.9278, UEM: 0.6919, LEM: 0.4669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1804, partial_loss/deprel_loss: 0.2561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4330, loss: 0.5624, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||:  24%|##4       | 23/95 [00:15<00:47,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9630, LAS: 0.9291, UEM: 0.7137, LEM: 0.4966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1964, partial_loss/deprel_loss: 0.2525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4333, loss: 0.5527, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||:  27%|##7       | 26/95 [00:17<00:47,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9634, LAS: 0.9295, UEM: 0.7100, LEM: 0.4893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1755, partial_loss/deprel_loss: 0.2720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4447, loss: 0.5503, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||:  31%|###       | 29/95 [00:19<00:46,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9638, LAS: 0.9299, UEM: 0.7098, LEM: 0.4877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3978, partial_loss/deprel_loss: 0.3517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5530, loss: 0.5488, batch_reg_loss: 0.1921, reg_loss: 0.1921 ||:  34%|###3      | 32/95 [00:22<00:45,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9628, LAS: 0.9285, UEM: 0.6919, LEM: 0.4684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5739, partial_loss/deprel_loss: 0.5345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7344, loss: 0.5599, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||:  38%|###7      | 36/95 [00:24<00:41,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9634, LAS: 0.9293, UEM: 0.7012, LEM: 0.4788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5302, partial_loss/deprel_loss: 0.4308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6427, loss: 0.5536, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||:  41%|####1     | 39/95 [00:26<00:39,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9629, LAS: 0.9287, UEM: 0.6886, LEM: 0.4653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3934, partial_loss/deprel_loss: 0.4782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6533, loss: 0.5574, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||:  45%|####5     | 43/95 [00:29<00:36,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9615, LAS: 0.9273, UEM: 0.6715, LEM: 0.4505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4694, partial_loss/deprel_loss: 0.3812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5908, loss: 0.5673, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||:  49%|####9     | 47/95 [00:31<00:32,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9616, LAS: 0.9273, UEM: 0.6700, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2493, partial_loss/deprel_loss: 0.3382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.5664, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||:  53%|#####2    | 50/95 [00:33<00:30,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9618, LAS: 0.9275, UEM: 0.6755, LEM: 0.4539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1519, partial_loss/deprel_loss: 0.2576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4284, loss: 0.5625, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||:  56%|#####5    | 53/95 [00:36<00:29,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8838, UAS: 0.9614, LAS: 0.9269, UEM: 0.6713, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9562, partial_loss/deprel_loss: 0.5576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8293, loss: 0.5657, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||:  59%|#####8    | 56/95 [00:38<00:27,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9609, LAS: 0.9267, UEM: 0.6684, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2975, partial_loss/deprel_loss: 0.2845, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4790, loss: 0.5669, batch_reg_loss: 0.1920, reg_loss: 0.1921 ||:  62%|######2   | 59/95 [00:40<00:25,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9610, LAS: 0.9268, UEM: 0.6650, LEM: 0.4399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3575, partial_loss/deprel_loss: 0.4162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5965, loss: 0.5666, batch_reg_loss: 0.1920, reg_loss: 0.1920 ||:  66%|######6   | 63/95 [00:42<00:21,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9352, UAS: 0.9614, LAS: 0.9274, UEM: 0.6638, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2857, partial_loss/deprel_loss: 0.3097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4968, loss: 0.5629, batch_reg_loss: 0.1920, reg_loss: 0.1920 ||:  71%|#######   | 67/95 [00:45<00:18,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9615, LAS: 0.9277, UEM: 0.6603, LEM: 0.4336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5243, partial_loss/deprel_loss: 0.4155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6292, loss: 0.5623, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||:  75%|#######4  | 71/95 [00:48<00:16,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9614, LAS: 0.9276, UEM: 0.6570, LEM: 0.4291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5893, partial_loss/deprel_loss: 0.4940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7050, loss: 0.5624, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||:  78%|#######7  | 74/95 [00:50<00:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9616, LAS: 0.9279, UEM: 0.6575, LEM: 0.4292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5763, partial_loss/deprel_loss: 0.4984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7059, loss: 0.5618, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||:  81%|########1 | 77/95 [00:52<00:12,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9619, LAS: 0.9281, UEM: 0.6649, LEM: 0.4390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0667, partial_loss/deprel_loss: 0.2107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3739, loss: 0.5604, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||:  84%|########4 | 80/95 [00:55<00:11,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9623, LAS: 0.9286, UEM: 0.6652, LEM: 0.4371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2707, partial_loss/deprel_loss: 0.3376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5161, loss: 0.5585, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||:  88%|########8 | 84/95 [00:57<00:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9626, LAS: 0.9291, UEM: 0.6767, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3567, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6076, loss: 0.5566, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||:  92%|#########1| 87/95 [01:00<00:06,  1.32it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9621, LAS: 0.9284, UEM: 0.6697, LEM: 0.4488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8095, partial_loss/deprel_loss: 0.5292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7772, loss: 0.5611, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||:  96%|#########5| 91/95 [01:02<00:02,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9624, LAS: 0.9285, UEM: 0.6747, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1141, partial_loss/deprel_loss: 0.2310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3995, loss: 0.5591, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||: 100%|##########| 95/95 [01:04<00:00,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9624, LAS: 0.9285, UEM: 0.6747, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1141, partial_loss/deprel_loss: 0.2310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3995, loss: 0.5591, batch_reg_loss: 0.1919, reg_loss: 0.1920 ||: 100%|##########| 95/95 [01:04<00:00,  1.46it/s]\n",
+      "2023-04-07 01:52:24,158 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:52:24,158 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 01:52:24,158 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.192  |       N/A\n",
+      "2023-04-07 01:52:24,158 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - UEM                      |     0.675  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - LEM                      |     0.453  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - EM                       |     0.947  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.114  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.231  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - loss                     |     0.559  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:52:24,159 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:52:24,160 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:52:24,160 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:52:24,160 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:52:24,160 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:52:24,165 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:52:30,974 - INFO - combo.training.trainer - Epoch duration: 0:01:15.460015\n",
+      "2023-04-07 01:52:30,975 - INFO - combo.training.trainer - Estimated training time remaining: 4:40:09\n",
+      "2023-04-07 01:52:30,975 - INFO - allennlp.training.trainer - Epoch 158/399\n",
+      "2023-04-07 01:52:30,975 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:52:30,975 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:52:30,983 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9512, LAS: 0.9167, UEM: 0.4082, LEM: 0.1803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4347, partial_loss/deprel_loss: 0.3830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5852, loss: 0.6455, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||:   3%|3         | 3/95 [00:02<01:03,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9431, UAS: 0.9581, LAS: 0.9261, UEM: 0.5239, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.3076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4925, loss: 0.5920, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||:   6%|6         | 6/95 [00:04<01:03,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9609, LAS: 0.9278, UEM: 0.5954, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1440, partial_loss/deprel_loss: 0.3057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4652, loss: 0.5821, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||:   9%|9         | 9/95 [00:06<01:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9646, LAS: 0.9328, UEM: 0.7253, LEM: 0.5343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2249, partial_loss/deprel_loss: 0.2992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4762, loss: 0.5446, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||:  12%|#1        | 11/95 [00:08<01:07,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9666, LAS: 0.9345, UEM: 0.7312, LEM: 0.5271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1664, partial_loss/deprel_loss: 0.2457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4217, loss: 0.5319, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||:  15%|#4        | 14/95 [00:10<01:03,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9677, LAS: 0.9352, UEM: 0.7371, LEM: 0.5285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3120, partial_loss/deprel_loss: 0.3147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5060, loss: 0.5235, batch_reg_loss: 0.1919, reg_loss: 0.1919 ||:  18%|#7        | 17/95 [00:13<01:00,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9656, LAS: 0.9328, UEM: 0.7227, LEM: 0.5151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1606, partial_loss/deprel_loss: 0.2426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4180, loss: 0.5381, batch_reg_loss: 0.1918, reg_loss: 0.1919 ||:  21%|##1       | 20/95 [00:15<00:56,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9658, LAS: 0.9335, UEM: 0.7145, LEM: 0.5046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2215, partial_loss/deprel_loss: 0.2695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4517, loss: 0.5310, batch_reg_loss: 0.1918, reg_loss: 0.1919 ||:  25%|##5       | 24/95 [00:17<00:50,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9668, LAS: 0.9342, UEM: 0.7202, LEM: 0.5015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1747, partial_loss/deprel_loss: 0.3145, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4783, loss: 0.5258, batch_reg_loss: 0.1918, reg_loss: 0.1919 ||:  28%|##8       | 27/95 [00:19<00:49,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9669, LAS: 0.9343, UEM: 0.7249, LEM: 0.5062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5693, partial_loss/deprel_loss: 0.4659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6784, loss: 0.5244, batch_reg_loss: 0.1918, reg_loss: 0.1919 ||:  32%|###1      | 30/95 [00:22<00:47,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9650, LAS: 0.9322, UEM: 0.7041, LEM: 0.4847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3941, partial_loss/deprel_loss: 0.4029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5930, loss: 0.5382, batch_reg_loss: 0.1918, reg_loss: 0.1918 ||:  36%|###5      | 34/95 [00:24<00:42,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9383, UAS: 0.9654, LAS: 0.9326, UEM: 0.7031, LEM: 0.4802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2435, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4975, loss: 0.5356, batch_reg_loss: 0.1918, reg_loss: 0.1918 ||:  40%|####      | 38/95 [00:27<00:38,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9647, LAS: 0.9321, UEM: 0.6988, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1723, partial_loss/deprel_loss: 0.2438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4213, loss: 0.5386, batch_reg_loss: 0.1918, reg_loss: 0.1918 ||:  44%|####4     | 42/95 [00:30<00:36,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9647, LAS: 0.9319, UEM: 0.6935, LEM: 0.4689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3095, partial_loss/deprel_loss: 0.3647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5454, loss: 0.5406, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||:  48%|####8     | 46/95 [00:32<00:32,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9651, LAS: 0.9325, UEM: 0.7000, LEM: 0.4756, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3892, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5890, loss: 0.5369, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||:  52%|#####1    | 49/95 [00:34<00:31,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9653, LAS: 0.9327, UEM: 0.7027, LEM: 0.4786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1235, partial_loss/deprel_loss: 0.2544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4200, loss: 0.5361, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||:  55%|#####4    | 52/95 [00:36<00:29,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9647, LAS: 0.9320, UEM: 0.6959, LEM: 0.4718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6449, partial_loss/deprel_loss: 0.5230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7391, loss: 0.5420, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||:  58%|#####7    | 55/95 [00:39<00:29,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9646, LAS: 0.9317, UEM: 0.6893, LEM: 0.4628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3482, partial_loss/deprel_loss: 0.4070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5869, loss: 0.5438, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||:  61%|######1   | 58/95 [00:41<00:26,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9652, LAS: 0.9324, UEM: 0.6942, LEM: 0.4672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3748, partial_loss/deprel_loss: 0.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5484, loss: 0.5389, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||:  65%|######5   | 62/95 [00:43<00:22,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9651, LAS: 0.9322, UEM: 0.6969, LEM: 0.4718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0805, partial_loss/deprel_loss: 0.2259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3885, loss: 0.5402, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||:  68%|######8   | 65/95 [00:46<00:22,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8767, UAS: 0.9640, LAS: 0.9312, UEM: 0.6889, LEM: 0.4655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1801, partial_loss/deprel_loss: 0.5861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8966, loss: 0.5461, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||:  72%|#######1  | 68/95 [00:48<00:19,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9360, UAS: 0.9641, LAS: 0.9313, UEM: 0.6869, LEM: 0.4629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2721, partial_loss/deprel_loss: 0.3842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5535, loss: 0.5456, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||:  76%|#######5  | 72/95 [00:51<00:16,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9638, LAS: 0.9309, UEM: 0.6826, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1630, partial_loss/deprel_loss: 0.2580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4307, loss: 0.5491, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||:  80%|########  | 76/95 [00:53<00:13,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9636, LAS: 0.9306, UEM: 0.6749, LEM: 0.4507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2799, partial_loss/deprel_loss: 0.3554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5320, loss: 0.5515, batch_reg_loss: 0.1917, reg_loss: 0.1918 ||:  84%|########4 | 80/95 [00:56<00:09,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9636, LAS: 0.9306, UEM: 0.6741, LEM: 0.4485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6128, partial_loss/deprel_loss: 0.4970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7118, loss: 0.5511, batch_reg_loss: 0.1916, reg_loss: 0.1918 ||:  88%|########8 | 84/95 [00:59<00:07,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9636, LAS: 0.9305, UEM: 0.6716, LEM: 0.4454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2457, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5520, loss: 0.5515, batch_reg_loss: 0.1916, reg_loss: 0.1918 ||:  92%|#########1| 87/95 [01:01<00:05,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9638, LAS: 0.9305, UEM: 0.6772, LEM: 0.4532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4094, partial_loss/deprel_loss: 0.4092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6009, loss: 0.5505, batch_reg_loss: 0.1916, reg_loss: 0.1918 ||:  95%|#########4| 90/95 [01:03<00:03,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8988, UAS: 0.9631, LAS: 0.9297, UEM: 0.6746, LEM: 0.4512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8202, partial_loss/deprel_loss: 0.5688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8107, loss: 0.5554, batch_reg_loss: 0.1916, reg_loss: 0.1917 ||:  99%|#########8| 94/95 [01:05<00:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9557, UAS: 0.9633, LAS: 0.9300, UEM: 0.6788, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0983, partial_loss/deprel_loss: 0.2248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3911, loss: 0.5537, batch_reg_loss: 0.1916, reg_loss: 0.1917 ||: 100%|##########| 95/95 [01:06<00:00,  1.43it/s]\n",
+      "2023-04-07 01:53:40,249 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.192  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - UEM                      |     0.679  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - LEM                      |     0.456  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - EM                       |     0.956  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.098  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.225  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - loss                     |     0.554  |       N/A\n",
+      "2023-04-07 01:53:40,250 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - LAS                      |     0.930  |       N/A\n",
+      "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:53:40,251 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:53:42,138 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:53:46,737 - INFO - combo.training.trainer - Epoch duration: 0:01:15.762648\n",
+      "2023-04-07 01:53:46,738 - INFO - combo.training.trainer - Estimated training time remaining: 4:39:09\n",
+      "2023-04-07 01:53:46,738 - INFO - allennlp.training.trainer - Epoch 159/399\n",
+      "2023-04-07 01:53:46,738 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:53:46,739 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:53:46,748 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9558, LAS: 0.9254, UEM: 0.4000, LEM: 0.1876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2381, partial_loss/deprel_loss: 0.3095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4869, loss: 0.5982, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||:   5%|5         | 5/95 [00:02<00:42,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9604, LAS: 0.9288, UEM: 0.5916, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0738, partial_loss/deprel_loss: 0.2280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3887, loss: 0.5749, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||:  11%|#         | 10/95 [00:04<00:40,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9642, LAS: 0.9318, UEM: 0.6435, LEM: 0.4006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1799, partial_loss/deprel_loss: 0.3075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4736, loss: 0.5529, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||:  14%|#3        | 13/95 [00:07<00:48,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9672, LAS: 0.9347, UEM: 0.7097, LEM: 0.4734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1916, partial_loss/deprel_loss: 0.2404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4223, loss: 0.5279, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||:  17%|#6        | 16/95 [00:09<00:51,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9663, LAS: 0.9337, UEM: 0.6978, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3619, partial_loss/deprel_loss: 0.3682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5585, loss: 0.5315, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||:  20%|##        | 19/95 [00:12<00:52,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9658, LAS: 0.9327, UEM: 0.6779, LEM: 0.4455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3998, partial_loss/deprel_loss: 0.4361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6204, loss: 0.5353, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||:  23%|##3       | 22/95 [00:14<00:51,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9652, LAS: 0.9323, UEM: 0.6699, LEM: 0.4401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4226, partial_loss/deprel_loss: 0.4153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6083, loss: 0.5388, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||:  26%|##6       | 25/95 [00:16<00:49,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9638, LAS: 0.9309, UEM: 0.6480, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2334, partial_loss/deprel_loss: 0.3410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5111, loss: 0.5503, batch_reg_loss: 0.1916, reg_loss: 0.1916 ||:  31%|###       | 29/95 [00:19<00:46,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9647, LAS: 0.9317, UEM: 0.6596, LEM: 0.4328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4591, partial_loss/deprel_loss: 0.4312, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6283, loss: 0.5452, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||:  35%|###4      | 33/95 [00:21<00:41,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9648, LAS: 0.9318, UEM: 0.6602, LEM: 0.4320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1464, partial_loss/deprel_loss: 0.2929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4551, loss: 0.5421, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||:  38%|###7      | 36/95 [00:23<00:40,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9636, LAS: 0.9308, UEM: 0.6529, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2751, partial_loss/deprel_loss: 0.3254, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5068, loss: 0.5493, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||:  41%|####1     | 39/95 [00:26<00:39,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9634, LAS: 0.9305, UEM: 0.6588, LEM: 0.4336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1040, partial_loss/deprel_loss: 0.2207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3889, loss: 0.5507, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||:  44%|####4     | 42/95 [00:28<00:37,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9628, LAS: 0.9299, UEM: 0.6538, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1895, partial_loss/deprel_loss: 0.2882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4600, loss: 0.5544, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||:  48%|####8     | 46/95 [00:30<00:33,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9632, LAS: 0.9302, UEM: 0.6575, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4074, partial_loss/deprel_loss: 0.4105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6014, loss: 0.5526, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||:  52%|#####1    | 49/95 [00:32<00:31,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9627, LAS: 0.9296, UEM: 0.6498, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4384, partial_loss/deprel_loss: 0.3587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5661, loss: 0.5555, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||:  56%|#####5    | 53/95 [00:35<00:27,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9320, UAS: 0.9629, LAS: 0.9298, UEM: 0.6488, LEM: 0.4185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3685, partial_loss/deprel_loss: 0.3698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5610, loss: 0.5553, batch_reg_loss: 0.1915, reg_loss: 0.1916 ||:  60%|######    | 57/95 [00:37<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9625, LAS: 0.9291, UEM: 0.6473, LEM: 0.4163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5485, partial_loss/deprel_loss: 0.4626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6712, loss: 0.5580, batch_reg_loss: 0.1915, reg_loss: 0.1915 ||:  64%|######4   | 61/95 [00:40<00:22,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9630, LAS: 0.9297, UEM: 0.6631, LEM: 0.4365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1971, partial_loss/deprel_loss: 0.3139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4820, loss: 0.5543, batch_reg_loss: 0.1915, reg_loss: 0.1915 ||:  68%|######8   | 65/95 [00:43<00:21,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9626, LAS: 0.9294, UEM: 0.6562, LEM: 0.4309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4976, partial_loss/deprel_loss: 0.3750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5910, loss: 0.5566, batch_reg_loss: 0.1915, reg_loss: 0.1915 ||:  72%|#######1  | 68/95 [00:46<00:19,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9630, LAS: 0.9297, UEM: 0.6571, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2111, partial_loss/deprel_loss: 0.3499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5136, loss: 0.5550, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||:  76%|#######5  | 72/95 [00:48<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9630, LAS: 0.9298, UEM: 0.6630, LEM: 0.4375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6367, partial_loss/deprel_loss: 0.5429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7531, loss: 0.5549, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||:  79%|#######8  | 75/95 [00:50<00:14,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9631, LAS: 0.9299, UEM: 0.6651, LEM: 0.4400, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2904, partial_loss/deprel_loss: 0.3650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5415, loss: 0.5535, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||:  82%|########2 | 78/95 [00:53<00:12,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9626, LAS: 0.9293, UEM: 0.6625, LEM: 0.4380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2748, partial_loss/deprel_loss: 0.3258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5070, loss: 0.5566, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||:  85%|########5 | 81/95 [00:55<00:10,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9624, LAS: 0.9290, UEM: 0.6622, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3186, partial_loss/deprel_loss: 0.4295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5987, loss: 0.5579, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||:  89%|########9 | 85/95 [00:57<00:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9626, LAS: 0.9290, UEM: 0.6635, LEM: 0.4376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2641, partial_loss/deprel_loss: 0.3588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5313, loss: 0.5574, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||:  93%|#########2| 88/95 [00:59<00:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8830, UAS: 0.9624, LAS: 0.9288, UEM: 0.6653, LEM: 0.4387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9281, partial_loss/deprel_loss: 0.5648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8289, loss: 0.5582, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||:  96%|#########5| 91/95 [01:02<00:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9732, UAS: 0.9624, LAS: 0.9289, UEM: 0.6723, LEM: 0.4523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0274, partial_loss/deprel_loss: 0.1028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2791, loss: 0.5586, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||: 100%|##########| 95/95 [01:05<00:00,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9732, UAS: 0.9624, LAS: 0.9289, UEM: 0.6723, LEM: 0.4523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0274, partial_loss/deprel_loss: 0.1028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2791, loss: 0.5586, batch_reg_loss: 0.1914, reg_loss: 0.1915 ||: 100%|##########| 95/95 [01:05<00:00,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:54:54,853 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:54:54,853 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.192  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - UEM                      |     0.672  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - LEM                      |     0.452  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - EM                       |     0.973  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.027  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.103  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - loss                     |     0.559  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:54:54,854 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:54:54,855 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:54:54,855 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:54:54,855 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:54:54,855 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:54:54,859 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:54:58,881 - INFO - combo.training.trainer - Epoch duration: 0:01:12.142955\n",
+      "2023-04-07 01:54:58,882 - INFO - combo.training.trainer - Estimated training time remaining: 4:38:04\n",
+      "2023-04-07 01:54:58,882 - INFO - allennlp.training.trainer - Epoch 160/399\n",
+      "2023-04-07 01:54:58,882 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:54:58,882 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:54:58,890 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9763, LAS: 0.9455, UEM: 0.8416, LEM: 0.6602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2320, partial_loss/deprel_loss: 0.2936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4727, loss: 0.4444, batch_reg_loss: 0.1914, reg_loss: 0.1914 ||:   3%|3         | 3/95 [00:02<01:15,  1.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9635, LAS: 0.9305, UEM: 0.7475, LEM: 0.5457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6281, partial_loss/deprel_loss: 0.4631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6875, loss: 0.5448, batch_reg_loss: 0.1914, reg_loss: 0.1914 ||:   7%|7         | 7/95 [00:04<01:06,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9628, LAS: 0.9300, UEM: 0.6904, LEM: 0.4797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3590, partial_loss/deprel_loss: 0.3953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5794, loss: 0.5437, batch_reg_loss: 0.1914, reg_loss: 0.1914 ||:  13%|#2        | 12/95 [00:07<00:55,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9651, LAS: 0.9323, UEM: 0.7082, LEM: 0.4906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1083, partial_loss/deprel_loss: 0.2273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3948, loss: 0.5286, batch_reg_loss: 0.1913, reg_loss: 0.1914 ||:  18%|#7        | 17/95 [00:09<00:47,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9348, UAS: 0.9658, LAS: 0.9333, UEM: 0.7009, LEM: 0.4815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2770, partial_loss/deprel_loss: 0.3270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5083, loss: 0.5212, batch_reg_loss: 0.1913, reg_loss: 0.1914 ||:  23%|##3       | 22/95 [00:11<00:41,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9545, UAS: 0.9651, LAS: 0.9327, UEM: 0.6852, LEM: 0.4615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1269, partial_loss/deprel_loss: 0.2500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4167, loss: 0.5297, batch_reg_loss: 0.1913, reg_loss: 0.1913 ||:  28%|##8       | 27/95 [00:14<00:37,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9650, LAS: 0.9327, UEM: 0.6704, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3497, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.5316, batch_reg_loss: 0.1913, reg_loss: 0.1913 ||:  33%|###2      | 31/95 [00:17<00:37,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9657, LAS: 0.9333, UEM: 0.6804, LEM: 0.4557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1903, partial_loss/deprel_loss: 0.3031, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4718, loss: 0.5281, batch_reg_loss: 0.1913, reg_loss: 0.1913 ||:  37%|###6      | 35/95 [00:20<00:38,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9650, LAS: 0.9328, UEM: 0.6808, LEM: 0.4576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1476, partial_loss/deprel_loss: 0.2481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.5313, batch_reg_loss: 0.1913, reg_loss: 0.1913 ||:  41%|####1     | 39/95 [00:23<00:37,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9647, LAS: 0.9325, UEM: 0.6787, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4090, partial_loss/deprel_loss: 0.4110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6019, loss: 0.5324, batch_reg_loss: 0.1913, reg_loss: 0.1913 ||:  44%|####4     | 42/95 [00:25<00:37,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9642, LAS: 0.9318, UEM: 0.6684, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2816, partial_loss/deprel_loss: 0.3724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.5373, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  48%|####8     | 46/95 [00:28<00:34,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9640, LAS: 0.9315, UEM: 0.6639, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1647, partial_loss/deprel_loss: 0.2714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4413, loss: 0.5395, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  52%|#####1    | 49/95 [00:30<00:32,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9648, LAS: 0.9324, UEM: 0.6768, LEM: 0.4520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2503, partial_loss/deprel_loss: 0.3267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5026, loss: 0.5331, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  55%|#####4    | 52/95 [00:32<00:30,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9651, LAS: 0.9327, UEM: 0.6788, LEM: 0.4529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4462, partial_loss/deprel_loss: 0.3923, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5943, loss: 0.5310, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  59%|#####8    | 56/95 [00:34<00:26,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9646, LAS: 0.9321, UEM: 0.6794, LEM: 0.4571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4600, partial_loss/deprel_loss: 0.4477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6414, loss: 0.5378, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  63%|######3   | 60/95 [00:37<00:23,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9507, UAS: 0.9639, LAS: 0.9315, UEM: 0.6732, LEM: 0.4521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2364, partial_loss/deprel_loss: 0.2890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4697, loss: 0.5420, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  68%|######8   | 65/95 [00:40<00:18,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9639, LAS: 0.9315, UEM: 0.6766, LEM: 0.4569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5849, partial_loss/deprel_loss: 0.4290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6514, loss: 0.5426, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  73%|#######2  | 69/95 [00:43<00:17,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9642, LAS: 0.9316, UEM: 0.6796, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2187, partial_loss/deprel_loss: 0.3388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5059, loss: 0.5414, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  77%|#######6  | 73/95 [00:46<00:15,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9633, LAS: 0.9308, UEM: 0.6734, LEM: 0.4519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4063, partial_loss/deprel_loss: 0.4231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6109, loss: 0.5485, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  80%|########  | 76/95 [00:48<00:13,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9632, LAS: 0.9307, UEM: 0.6718, LEM: 0.4500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2511, partial_loss/deprel_loss: 0.3529, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5237, loss: 0.5496, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  83%|########3 | 79/95 [00:50<00:11,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9627, LAS: 0.9302, UEM: 0.6643, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3886, partial_loss/deprel_loss: 0.3747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5686, loss: 0.5549, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  86%|########6 | 82/95 [00:52<00:09,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9200, UAS: 0.9631, LAS: 0.9304, UEM: 0.6688, LEM: 0.4471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2840, partial_loss/deprel_loss: 0.3865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5571, loss: 0.5524, batch_reg_loss: 0.1912, reg_loss: 0.1913 ||:  91%|######### | 86/95 [00:55<00:06,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9768, UAS: 0.9637, LAS: 0.9313, UEM: 0.6856, LEM: 0.4699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0250, partial_loss/deprel_loss: 0.0992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2755, loss: 0.5481, batch_reg_loss: 0.1911, reg_loss: 0.1913 ||:  94%|#########3| 89/95 [00:57<00:04,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9638, LAS: 0.9313, UEM: 0.6840, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3355, partial_loss/deprel_loss: 0.3595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5459, loss: 0.5469, batch_reg_loss: 0.1911, reg_loss: 0.1912 ||:  98%|#########7| 93/95 [01:00<00:01,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9636, LAS: 0.9310, UEM: 0.6800, LEM: 0.4631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6199, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6722, loss: 0.5485, batch_reg_loss: 0.1911, reg_loss: 0.1912 ||: 100%|##########| 95/95 [01:01<00:00,  1.54it/s]\n",
+      "2023-04-07 01:56:03,562 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9437, UAS: 0.9694, LAS: 0.9243, UEM: 0.8308, LEM: 0.5652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1994, partial_loss/deprel_loss: 4.8253, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9001, loss: 5.2767, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:07,  1.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8858, UAS: 0.9577, LAS: 0.9093, UEM: 0.7087, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0427, partial_loss/deprel_loss: 8.4733, partial_loss/cycle_loss: 0.0000, batch_loss: 6.9872, loss: 6.0390, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  55%|#####4    | 6/11 [00:05<00:04,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.9586, LAS: 0.9096, UEM: 0.7243, LEM: 0.4414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0864, partial_loss/deprel_loss: 13.6287, partial_loss/cycle_loss: 0.0000, batch_loss: 11.1203, loss: 6.2996, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  82%|########1 | 9/11 [00:08<00:01,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8594, UAS: 0.9520, LAS: 0.9019, UEM: 0.6842, LEM: 0.4090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5402, partial_loss/deprel_loss: 18.2763, partial_loss/cycle_loss: 0.0000, batch_loss: 14.9291, loss: 7.6460, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8594, UAS: 0.9520, LAS: 0.9019, UEM: 0.6842, LEM: 0.4090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5402, partial_loss/deprel_loss: 18.2763, partial_loss/cycle_loss: 0.0000, batch_loss: 14.9291, loss: 7.6460, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:10<00:00,  1.02it/s]\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.191  |     0.000\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - UEM                      |     0.680  |     0.684\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - LEM                      |     0.463  |     0.409\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - EM                       |     0.905  |     0.859\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.620  |     1.540\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - UAS                      |     0.964  |     0.952\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:56:14,328 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.446  |    18.276\n",
+      "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - loss                     |     0.549  |     7.646\n",
+      "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |     0.902\n",
+      "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:56:14,329 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:56:14,334 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:56:21,425 - INFO - combo.training.trainer - Epoch duration: 0:01:22.543137\n",
+      "2023-04-07 01:56:21,426 - INFO - combo.training.trainer - Estimated training time remaining: 4:37:13\n",
+      "2023-04-07 01:56:21,426 - INFO - allennlp.training.trainer - Epoch 161/399\n",
+      "2023-04-07 01:56:21,426 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:56:21,427 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:56:21,437 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9555, LAS: 0.9184, UEM: 0.5959, LEM: 0.3368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2770, partial_loss/deprel_loss: 0.3564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5317, loss: 0.6300, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||:   3%|3         | 3/95 [00:02<01:03,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9557, LAS: 0.9243, UEM: 0.5085, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5083, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5787, loss: 0.5879, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||:   7%|7         | 7/95 [00:04<00:58,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9423, UAS: 0.9628, LAS: 0.9307, UEM: 0.6356, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1819, partial_loss/deprel_loss: 0.2977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4656, loss: 0.5359, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||:  13%|#2        | 12/95 [00:07<00:52,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9512, UAS: 0.9621, LAS: 0.9294, UEM: 0.6676, LEM: 0.4297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0854, partial_loss/deprel_loss: 0.2194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3837, loss: 0.5444, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||:  17%|#6        | 16/95 [00:09<00:48,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9627, LAS: 0.9303, UEM: 0.6596, LEM: 0.4195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3484, partial_loss/deprel_loss: 0.3827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5670, loss: 0.5401, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||:  21%|##1       | 20/95 [00:11<00:45,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9648, LAS: 0.9327, UEM: 0.6894, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1833, partial_loss/deprel_loss: 0.2747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4475, loss: 0.5236, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||:  25%|##5       | 24/95 [00:14<00:42,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9639, LAS: 0.9313, UEM: 0.6683, LEM: 0.4304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3213, partial_loss/deprel_loss: 0.3911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5682, loss: 0.5348, batch_reg_loss: 0.1911, reg_loss: 0.1911 ||:  29%|##9       | 28/95 [00:16<00:41,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9643, LAS: 0.9318, UEM: 0.6854, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7576, partial_loss/deprel_loss: 0.4802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7267, loss: 0.5320, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||:  34%|###3      | 32/95 [00:19<00:38,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9627, LAS: 0.9301, UEM: 0.6603, LEM: 0.4272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3612, partial_loss/deprel_loss: 0.3130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5137, loss: 0.5463, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||:  39%|###8      | 37/95 [00:21<00:32,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9624, LAS: 0.9297, UEM: 0.6565, LEM: 0.4232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1974, partial_loss/deprel_loss: 0.2774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4524, loss: 0.5493, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||:  44%|####4     | 42/95 [00:23<00:27,  1.91it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9625, LAS: 0.9298, UEM: 0.6596, LEM: 0.4296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2212, partial_loss/deprel_loss: 0.3290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4984, loss: 0.5477, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||:  48%|####8     | 46/95 [00:26<00:28,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9631, LAS: 0.9304, UEM: 0.6641, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3073, partial_loss/deprel_loss: 0.3479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5308, loss: 0.5449, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||:  53%|#####2    | 50/95 [00:29<00:27,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9642, LAS: 0.9315, UEM: 0.6857, LEM: 0.4569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1297, partial_loss/deprel_loss: 0.2576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4230, loss: 0.5365, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||:  57%|#####6    | 54/95 [00:32<00:26,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9639, LAS: 0.9311, UEM: 0.6912, LEM: 0.4677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5797, partial_loss/deprel_loss: 0.4343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6543, loss: 0.5392, batch_reg_loss: 0.1910, reg_loss: 0.1911 ||:  61%|######1   | 58/95 [00:34<00:24,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9639, LAS: 0.9308, UEM: 0.6910, LEM: 0.4648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2046, partial_loss/deprel_loss: 0.3376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5020, loss: 0.5417, batch_reg_loss: 0.1910, reg_loss: 0.1910 ||:  65%|######5   | 62/95 [00:37<00:21,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9455, UAS: 0.9638, LAS: 0.9310, UEM: 0.7006, LEM: 0.4848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2613, partial_loss/deprel_loss: 0.2678, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4575, loss: 0.5400, batch_reg_loss: 0.1910, reg_loss: 0.1910 ||:  69%|######9   | 66/95 [00:40<00:20,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9639, LAS: 0.9311, UEM: 0.7003, LEM: 0.4837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1505, partial_loss/deprel_loss: 0.2817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4464, loss: 0.5398, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||:  73%|#######2  | 69/95 [00:42<00:18,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9637, LAS: 0.9308, UEM: 0.6971, LEM: 0.4801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1655, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4598, loss: 0.5418, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||:  76%|#######5  | 72/95 [00:45<00:16,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9636, LAS: 0.9308, UEM: 0.6915, LEM: 0.4742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5565, partial_loss/deprel_loss: 0.4021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6239, loss: 0.5427, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||:  79%|#######8  | 75/95 [00:47<00:14,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9626, LAS: 0.9298, UEM: 0.6839, LEM: 0.4676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5635, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6496, loss: 0.5497, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||:  82%|########2 | 78/95 [00:49<00:12,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9625, LAS: 0.9297, UEM: 0.6848, LEM: 0.4701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3127, partial_loss/deprel_loss: 0.4014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5746, loss: 0.5505, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||:  85%|########5 | 81/95 [00:51<00:10,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9625, LAS: 0.9297, UEM: 0.6827, LEM: 0.4672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3948, partial_loss/deprel_loss: 0.3623, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5597, loss: 0.5507, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||:  88%|########8 | 84/95 [00:53<00:07,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9624, LAS: 0.9294, UEM: 0.6783, LEM: 0.4623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2434, partial_loss/deprel_loss: 0.3092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4869, loss: 0.5525, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||:  92%|#########1| 87/95 [00:55<00:05,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9622, LAS: 0.9292, UEM: 0.6732, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6044, partial_loss/deprel_loss: 0.4423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6656, loss: 0.5544, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||:  95%|#########4| 90/95 [00:57<00:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9625, LAS: 0.9295, UEM: 0.6752, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1655, partial_loss/deprel_loss: 0.3349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4919, loss: 0.5530, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||:  98%|#########7| 93/95 [00:59<00:01,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9624, LAS: 0.9294, UEM: 0.6733, LEM: 0.4563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4885, partial_loss/deprel_loss: 0.4326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6347, loss: 0.5530, batch_reg_loss: 0.1909, reg_loss: 0.1910 ||: 100%|##########| 95/95 [01:01<00:00,  1.55it/s]\n",
+      "2023-04-07 01:57:25,711 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:57:25,711 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.191  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - UEM                      |     0.673  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - LEM                      |     0.456  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - EM                       |     0.912  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.488  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.433  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - loss                     |     0.553  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:57:25,712 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:57:25,713 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:57:25,713 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:57:25,717 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:57:30,571 - INFO - combo.training.trainer - Epoch duration: 0:01:09.144809\n",
+      "2023-04-07 01:57:30,571 - INFO - combo.training.trainer - Estimated training time remaining: 4:36:03\n",
+      "2023-04-07 01:57:30,571 - INFO - allennlp.training.trainer - Epoch 162/399\n",
+      "2023-04-07 01:57:30,572 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:57:30,572 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:57:30,581 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9612, LAS: 0.9282, UEM: 0.6256, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2923, partial_loss/deprel_loss: 0.2939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4845, loss: 0.5527, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||:   3%|3         | 3/95 [00:02<01:06,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9637, LAS: 0.9303, UEM: 0.6470, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2618, partial_loss/deprel_loss: 0.3002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4834, loss: 0.5343, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||:   6%|6         | 6/95 [00:04<01:03,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9655, LAS: 0.9322, UEM: 0.6758, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1586, partial_loss/deprel_loss: 0.2265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4038, loss: 0.5210, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||:   9%|9         | 9/95 [00:06<01:01,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9663, LAS: 0.9335, UEM: 0.6827, LEM: 0.4549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5248, partial_loss/deprel_loss: 0.4342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6432, loss: 0.5187, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||:  14%|#3        | 13/95 [00:09<00:57,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9649, LAS: 0.9321, UEM: 0.6541, LEM: 0.4242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5915, partial_loss/deprel_loss: 0.4867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6985, loss: 0.5344, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||:  17%|#6        | 16/95 [00:11<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9638, LAS: 0.9311, UEM: 0.6333, LEM: 0.4019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6412, partial_loss/deprel_loss: 0.4716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6963, loss: 0.5446, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||:  20%|##        | 19/95 [00:13<00:53,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9652, LAS: 0.9328, UEM: 0.6613, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1766, partial_loss/deprel_loss: 0.2791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4494, loss: 0.5312, batch_reg_loss: 0.1909, reg_loss: 0.1909 ||:  23%|##3       | 22/95 [00:15<00:55,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9649, LAS: 0.9326, UEM: 0.6584, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4952, partial_loss/deprel_loss: 0.4124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.5325, batch_reg_loss: 0.1908, reg_loss: 0.1909 ||:  26%|##6       | 25/95 [00:17<00:51,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9160, UAS: 0.9648, LAS: 0.9324, UEM: 0.6507, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5078, partial_loss/deprel_loss: 0.4754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6727, loss: 0.5364, batch_reg_loss: 0.1908, reg_loss: 0.1909 ||:  31%|###       | 29/95 [00:20<00:46,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9383, UAS: 0.9663, LAS: 0.9335, UEM: 0.6773, LEM: 0.4399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1996, partial_loss/deprel_loss: 0.3330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.5272, batch_reg_loss: 0.1908, reg_loss: 0.1909 ||:  35%|###4      | 33/95 [00:23<00:43,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9653, LAS: 0.9324, UEM: 0.6630, LEM: 0.4262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5060, partial_loss/deprel_loss: 0.4764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6731, loss: 0.5343, batch_reg_loss: 0.1908, reg_loss: 0.1909 ||:  38%|###7      | 36/95 [00:25<00:41,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9654, LAS: 0.9324, UEM: 0.6623, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2030, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4791, loss: 0.5342, batch_reg_loss: 0.1908, reg_loss: 0.1909 ||:  41%|####1     | 39/95 [00:27<00:39,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9639, LAS: 0.9307, UEM: 0.6514, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4177, partial_loss/deprel_loss: 0.3685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5691, loss: 0.5440, batch_reg_loss: 0.1908, reg_loss: 0.1908 ||:  45%|####5     | 43/95 [00:29<00:34,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9629, LAS: 0.9299, UEM: 0.6561, LEM: 0.4238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1249, partial_loss/deprel_loss: 0.2237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3947, loss: 0.5477, batch_reg_loss: 0.1908, reg_loss: 0.1908 ||:  51%|#####     | 48/95 [00:32<00:28,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9627, LAS: 0.9296, UEM: 0.6457, LEM: 0.4128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3377, partial_loss/deprel_loss: 0.3512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5393, loss: 0.5492, batch_reg_loss: 0.1908, reg_loss: 0.1908 ||:  56%|#####5    | 53/95 [00:34<00:23,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9619, LAS: 0.9288, UEM: 0.6347, LEM: 0.4046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3078, partial_loss/deprel_loss: 0.3655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.5566, batch_reg_loss: 0.1908, reg_loss: 0.1908 ||:  61%|######1   | 58/95 [00:36<00:19,  1.93it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9724, UAS: 0.9630, LAS: 0.9303, UEM: 0.6753, LEM: 0.4605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0364, partial_loss/deprel_loss: 0.1030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2805, loss: 0.5460, batch_reg_loss: 0.1908, reg_loss: 0.1908 ||:  66%|######6   | 63/95 [00:39<00:16,  1.91it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9636, LAS: 0.9310, UEM: 0.6836, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2450, partial_loss/deprel_loss: 0.3171, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4934, loss: 0.5414, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||:  72%|#######1  | 68/95 [00:41<00:13,  2.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9630, LAS: 0.9301, UEM: 0.6758, LEM: 0.4605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3095, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5759, loss: 0.5470, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||:  77%|#######6  | 73/95 [00:43<00:10,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9631, LAS: 0.9303, UEM: 0.6746, LEM: 0.4584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1627, partial_loss/deprel_loss: 0.3092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4706, loss: 0.5461, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||:  82%|########2 | 78/95 [00:45<00:07,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9520, UAS: 0.9633, LAS: 0.9303, UEM: 0.6780, LEM: 0.4617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0843, partial_loss/deprel_loss: 0.2144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3791, loss: 0.5461, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||:  87%|########7 | 83/95 [00:47<00:05,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9631, LAS: 0.9300, UEM: 0.6730, LEM: 0.4551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4936, partial_loss/deprel_loss: 0.4443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6449, loss: 0.5479, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||:  93%|#########2| 88/95 [00:50<00:03,  2.15it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9630, LAS: 0.9299, UEM: 0.6716, LEM: 0.4537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2051, partial_loss/deprel_loss: 0.2338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4188, loss: 0.5476, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||:  98%|#########7| 93/95 [00:52<00:00,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9307, UAS: 0.9631, LAS: 0.9301, UEM: 0.6724, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3475, partial_loss/deprel_loss: 0.3907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5727, loss: 0.5462, batch_reg_loss: 0.1907, reg_loss: 0.1908 ||: 100%|##########| 95/95 [00:53<00:00,  1.77it/s]\n",
+      "2023-04-07 01:58:26,960 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:58:26,960 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 01:58:26,960 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.191  |       N/A\n",
+      "2023-04-07 01:58:26,960 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - UEM                      |     0.672  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - LEM                      |     0.454  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - EM                       |     0.931  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.347  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.391  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - loss                     |     0.546  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - LAS                      |     0.930  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:58:26,961 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:58:26,962 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:58:26,962 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:58:26,966 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:58:34,185 - INFO - combo.training.trainer - Epoch duration: 0:01:03.613676\n",
+      "2023-04-07 01:58:34,186 - INFO - combo.training.trainer - Estimated training time remaining: 4:34:45\n",
+      "2023-04-07 01:58:34,186 - INFO - allennlp.training.trainer - Epoch 163/399\n",
+      "2023-04-07 01:58:34,186 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:58:34,187 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:58:34,197 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9738, LAS: 0.9427, UEM: 0.7407, LEM: 0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3375, partial_loss/deprel_loss: 0.3351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5263, loss: 0.4713, batch_reg_loss: 0.1907, reg_loss: 0.1907 ||:   5%|5         | 5/95 [00:02<00:43,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9311, UAS: 0.9726, LAS: 0.9422, UEM: 0.7833, LEM: 0.5907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2743, partial_loss/deprel_loss: 0.3165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4987, loss: 0.4745, batch_reg_loss: 0.1906, reg_loss: 0.1907 ||:   9%|9         | 9/95 [00:04<00:41,  2.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9705, LAS: 0.9395, UEM: 0.7353, LEM: 0.5301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3920, partial_loss/deprel_loss: 0.3697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5648, loss: 0.4920, batch_reg_loss: 0.1906, reg_loss: 0.1906 ||:  15%|#4        | 14/95 [00:06<00:38,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9726, LAS: 0.9415, UEM: 0.7816, LEM: 0.5827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2579, partial_loss/deprel_loss: 0.3561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5270, loss: 0.4757, batch_reg_loss: 0.1906, reg_loss: 0.1906 ||:  19%|#8        | 18/95 [00:08<00:37,  2.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9678, LAS: 0.9356, UEM: 0.7379, LEM: 0.5402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3221, partial_loss/deprel_loss: 0.3727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5532, loss: 0.5152, batch_reg_loss: 0.1906, reg_loss: 0.1906 ||:  24%|##4       | 23/95 [00:11<00:34,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9665, LAS: 0.9344, UEM: 0.7124, LEM: 0.5132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2866, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5019, loss: 0.5233, batch_reg_loss: 0.1906, reg_loss: 0.1906 ||:  29%|##9       | 28/95 [00:13<00:31,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9596, UAS: 0.9660, LAS: 0.9340, UEM: 0.7136, LEM: 0.5188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0685, partial_loss/deprel_loss: 0.1542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3276, loss: 0.5238, batch_reg_loss: 0.1906, reg_loss: 0.1906 ||:  35%|###4      | 33/95 [00:15<00:29,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9494, UAS: 0.9666, LAS: 0.9346, UEM: 0.7175, LEM: 0.5170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1808, partial_loss/deprel_loss: 0.2531, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4292, loss: 0.5215, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||:  39%|###8      | 37/95 [00:17<00:28,  2.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9651, LAS: 0.9329, UEM: 0.7028, LEM: 0.5034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5526, partial_loss/deprel_loss: 0.5093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7085, loss: 0.5335, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||:  44%|####4     | 42/95 [00:20<00:26,  2.02it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9636, LAS: 0.9312, UEM: 0.6875, LEM: 0.4878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7577, partial_loss/deprel_loss: 0.6006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8225, loss: 0.5440, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||:  49%|####9     | 47/95 [00:22<00:23,  2.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9316, UAS: 0.9623, LAS: 0.9297, UEM: 0.6766, LEM: 0.4765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2872, partial_loss/deprel_loss: 0.3445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.5541, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||:  55%|#####4    | 52/95 [00:25<00:21,  2.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9624, LAS: 0.9298, UEM: 0.6881, LEM: 0.4863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1182, partial_loss/deprel_loss: 0.2426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4082, loss: 0.5534, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||:  60%|######    | 57/95 [00:27<00:18,  2.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9624, LAS: 0.9296, UEM: 0.6822, LEM: 0.4746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.3647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5306, loss: 0.5547, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||:  65%|######5   | 62/95 [00:30<00:16,  2.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9635, LAS: 0.9306, UEM: 0.6920, LEM: 0.4800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1464, partial_loss/deprel_loss: 0.2588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4269, loss: 0.5480, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||:  71%|#######   | 67/95 [00:32<00:13,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9633, LAS: 0.9302, UEM: 0.6827, LEM: 0.4689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4574, partial_loss/deprel_loss: 0.4027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6042, loss: 0.5511, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||:  76%|#######5  | 72/95 [00:34<00:10,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9631, LAS: 0.9301, UEM: 0.6784, LEM: 0.4643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4201, partial_loss/deprel_loss: 0.4119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6041, loss: 0.5508, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||:  81%|########1 | 77/95 [00:37<00:08,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9632, LAS: 0.9301, UEM: 0.6764, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1696, partial_loss/deprel_loss: 0.2757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4449, loss: 0.5505, batch_reg_loss: 0.1905, reg_loss: 0.1906 ||:  86%|########6 | 82/95 [00:39<00:06,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9633, LAS: 0.9301, UEM: 0.6720, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2312, partial_loss/deprel_loss: 0.3471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.5502, batch_reg_loss: 0.1905, reg_loss: 0.1905 ||:  92%|#########1| 87/95 [00:41<00:03,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9632, LAS: 0.9301, UEM: 0.6725, LEM: 0.4558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3495, partial_loss/deprel_loss: 0.3551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5444, loss: 0.5510, batch_reg_loss: 0.1905, reg_loss: 0.1905 ||:  97%|#########6| 92/95 [00:44<00:01,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9533, UAS: 0.9636, LAS: 0.9305, UEM: 0.6769, LEM: 0.4598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0981, partial_loss/deprel_loss: 0.2375, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4001, loss: 0.5482, batch_reg_loss: 0.1905, reg_loss: 0.1905 ||: 100%|##########| 95/95 [00:45<00:00,  2.09it/s]\n",
+      "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.191  |       N/A\n",
+      "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - UEM                      |     0.677  |       N/A\n",
+      "2023-04-07 01:59:22,894 - INFO - combo.training.tensorboard_writer - LEM                      |     0.460  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - EM                       |     0.953  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.098  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - UAS                      |     0.964  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.238  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - loss                     |     0.548  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - LAS                      |     0.930  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:59:22,895 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:59:22,902 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 01:59:27,729 - INFO - combo.training.trainer - Epoch duration: 0:00:53.542821\n",
+      "2023-04-07 01:59:27,729 - INFO - combo.training.trainer - Estimated training time remaining: 4:33:12\n",
+      "2023-04-07 01:59:27,729 - INFO - allennlp.training.trainer - Epoch 164/399\n",
+      "2023-04-07 01:59:27,730 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 01:59:27,730 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:59:27,740 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9148, UAS: 0.9619, LAS: 0.9298, UEM: 0.5734, LEM: 0.3344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5451, partial_loss/deprel_loss: 0.4259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6402, loss: 0.5597, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||:   5%|5         | 5/95 [00:02<00:44,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9635, LAS: 0.9322, UEM: 0.5934, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5574, partial_loss/deprel_loss: 0.3986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6208, loss: 0.5415, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||:  11%|#         | 10/95 [00:04<00:40,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9623, LAS: 0.9315, UEM: 0.5744, LEM: 0.3344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6257, partial_loss/deprel_loss: 0.4745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6951, loss: 0.5491, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||:  16%|#5        | 15/95 [00:06<00:37,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9658, LAS: 0.9341, UEM: 0.6419, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1404, partial_loss/deprel_loss: 0.2562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4234, loss: 0.5297, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||:  21%|##1       | 20/95 [00:09<00:35,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9634, LAS: 0.9315, UEM: 0.6415, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2309, partial_loss/deprel_loss: 0.3083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4832, loss: 0.5432, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||:  26%|##6       | 25/95 [00:11<00:32,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9616, LAS: 0.9299, UEM: 0.6162, LEM: 0.3831, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4382, partial_loss/deprel_loss: 0.3729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5763, loss: 0.5513, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||:  32%|###1      | 30/95 [00:13<00:29,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9616, LAS: 0.9295, UEM: 0.6095, LEM: 0.3768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5807, partial_loss/deprel_loss: 0.4786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6894, loss: 0.5535, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||:  37%|###6      | 35/95 [00:15<00:26,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9611, LAS: 0.9289, UEM: 0.6072, LEM: 0.3795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1790, partial_loss/deprel_loss: 0.2619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4357, loss: 0.5548, batch_reg_loss: 0.1904, reg_loss: 0.1904 ||:  42%|####2     | 40/95 [00:18<00:25,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9623, LAS: 0.9302, UEM: 0.6283, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3150, partial_loss/deprel_loss: 0.3416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.5459, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||:  47%|####7     | 45/95 [00:20<00:23,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9616, LAS: 0.9293, UEM: 0.6202, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2663, partial_loss/deprel_loss: 0.3061, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.5515, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||:  53%|#####2    | 50/95 [00:22<00:20,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9611, LAS: 0.9288, UEM: 0.6350, LEM: 0.4137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1256, partial_loss/deprel_loss: 0.2711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4323, loss: 0.5548, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||:  58%|#####7    | 55/95 [00:25<00:19,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9617, LAS: 0.9293, UEM: 0.6479, LEM: 0.4265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3178, partial_loss/deprel_loss: 0.3322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5196, loss: 0.5513, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||:  63%|######3   | 60/95 [00:28<00:17,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9625, LAS: 0.9300, UEM: 0.6559, LEM: 0.4316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2680, partial_loss/deprel_loss: 0.3304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5082, loss: 0.5457, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||:  68%|######8   | 65/95 [00:30<00:14,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9632, LAS: 0.9307, UEM: 0.6727, LEM: 0.4521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2048, partial_loss/deprel_loss: 0.2890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4625, loss: 0.5400, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||:  74%|#######3  | 70/95 [00:32<00:12,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9637, LAS: 0.9317, UEM: 0.6923, LEM: 0.4808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0938, partial_loss/deprel_loss: 0.2573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4149, loss: 0.5344, batch_reg_loss: 0.1903, reg_loss: 0.1904 ||:  79%|#######8  | 75/95 [00:35<00:09,  2.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9638, LAS: 0.9317, UEM: 0.6925, LEM: 0.4795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7148, partial_loss/deprel_loss: 0.5160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7460, loss: 0.5358, batch_reg_loss: 0.1902, reg_loss: 0.1904 ||:  84%|########4 | 80/95 [00:37<00:07,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9633, LAS: 0.9311, UEM: 0.6860, LEM: 0.4731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1684, partial_loss/deprel_loss: 0.2911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4568, loss: 0.5391, batch_reg_loss: 0.1902, reg_loss: 0.1903 ||:  89%|########9 | 85/95 [00:39<00:04,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9632, LAS: 0.9308, UEM: 0.6815, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2699, partial_loss/deprel_loss: 0.3483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5229, loss: 0.5407, batch_reg_loss: 0.1902, reg_loss: 0.1903 ||:  95%|#########4| 90/95 [00:42<00:02,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9631, LAS: 0.9307, UEM: 0.6746, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4054, partial_loss/deprel_loss: 0.3952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.5432, batch_reg_loss: 0.1902, reg_loss: 0.1903 ||: 100%|##########| 95/95 [00:44<00:00,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9631, LAS: 0.9307, UEM: 0.6746, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4054, partial_loss/deprel_loss: 0.3952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.5432, batch_reg_loss: 0.1902, reg_loss: 0.1903 ||: 100%|##########| 95/95 [00:44<00:00,  2.13it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.190  |       N/A\n",
+      "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - UEM                      |     0.675  |       N/A\n",
+      "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - LEM                      |     0.459  |       N/A\n",
+      "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - EM                       |     0.925  |       N/A\n",
+      "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.405  |       N/A\n",
+      "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:00:15,289 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.395  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - loss                     |     0.543  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:00:15,290 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:00:15,295 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:00:20,102 - INFO - combo.training.trainer - Epoch duration: 0:00:52.372078\n",
+      "2023-04-07 02:00:20,102 - INFO - combo.training.trainer - Estimated training time remaining: 4:31:38\n",
+      "2023-04-07 02:00:20,102 - INFO - allennlp.training.trainer - Epoch 165/399\n",
+      "2023-04-07 02:00:20,103 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:00:20,103 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:00:20,113 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9573, LAS: 0.9240, UEM: 0.5156, LEM: 0.2906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7770, partial_loss/deprel_loss: 0.5007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7461, loss: 0.5904, batch_reg_loss: 0.1902, reg_loss: 0.1902 ||:   5%|5         | 5/95 [00:02<00:41,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9650, LAS: 0.9322, UEM: 0.6708, LEM: 0.4558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2296, partial_loss/deprel_loss: 0.3998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.5407, batch_reg_loss: 0.1902, reg_loss: 0.1902 ||:  11%|#         | 10/95 [00:04<00:39,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9678, LAS: 0.9353, UEM: 0.7127, LEM: 0.4968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1809, partial_loss/deprel_loss: 0.2555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4308, loss: 0.5196, batch_reg_loss: 0.1902, reg_loss: 0.1902 ||:  15%|#4        | 14/95 [00:06<00:38,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9650, LAS: 0.9318, UEM: 0.6826, LEM: 0.4678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6285, partial_loss/deprel_loss: 0.4741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6952, loss: 0.5403, batch_reg_loss: 0.1902, reg_loss: 0.1902 ||:  20%|##        | 19/95 [00:08<00:35,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9671, LAS: 0.9345, UEM: 0.7417, LEM: 0.5474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1539, partial_loss/deprel_loss: 0.2764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4421, loss: 0.5187, batch_reg_loss: 0.1902, reg_loss: 0.1902 ||:  24%|##4       | 23/95 [00:11<00:35,  2.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9666, LAS: 0.9343, UEM: 0.7245, LEM: 0.5267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2292, partial_loss/deprel_loss: 0.3402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5082, loss: 0.5220, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||:  29%|##9       | 28/95 [00:13<00:32,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9647, LAS: 0.9324, UEM: 0.7068, LEM: 0.5070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6443, partial_loss/deprel_loss: 0.5178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7333, loss: 0.5348, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||:  35%|###4      | 33/95 [00:15<00:29,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9652, LAS: 0.9329, UEM: 0.7001, LEM: 0.4969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2062, partial_loss/deprel_loss: 0.2855, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4597, loss: 0.5303, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||:  40%|####      | 38/95 [00:18<00:27,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9655, LAS: 0.9333, UEM: 0.7031, LEM: 0.4947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1846, partial_loss/deprel_loss: 0.2773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4489, loss: 0.5274, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||:  45%|####5     | 43/95 [00:20<00:24,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9638, LAS: 0.9314, UEM: 0.6898, LEM: 0.4807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5657, partial_loss/deprel_loss: 0.4104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6316, loss: 0.5381, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||:  51%|#####     | 48/95 [00:22<00:21,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9632, LAS: 0.9309, UEM: 0.6809, LEM: 0.4694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5652, partial_loss/deprel_loss: 0.4961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7000, loss: 0.5434, batch_reg_loss: 0.1901, reg_loss: 0.1902 ||:  56%|#####5    | 53/95 [00:24<00:19,  2.21it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9642, LAS: 0.9317, UEM: 0.6983, LEM: 0.4861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0907, partial_loss/deprel_loss: 0.2074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3741, loss: 0.5356, batch_reg_loss: 0.1901, reg_loss: 0.1901 ||:  61%|######1   | 58/95 [00:27<00:17,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9344, UAS: 0.9641, LAS: 0.9314, UEM: 0.6879, LEM: 0.4740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3749, partial_loss/deprel_loss: 0.3637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5560, loss: 0.5394, batch_reg_loss: 0.1901, reg_loss: 0.1901 ||:  66%|######6   | 63/95 [00:29<00:14,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9640, LAS: 0.9312, UEM: 0.6810, LEM: 0.4659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4680, partial_loss/deprel_loss: 0.4725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6616, loss: 0.5400, batch_reg_loss: 0.1901, reg_loss: 0.1901 ||:  72%|#######1  | 68/95 [00:31<00:12,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9635, LAS: 0.9308, UEM: 0.6824, LEM: 0.4701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2634, partial_loss/deprel_loss: 0.3195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4983, loss: 0.5429, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||:  77%|#######6  | 73/95 [00:34<00:10,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9633, LAS: 0.9308, UEM: 0.6798, LEM: 0.4675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7059, partial_loss/deprel_loss: 0.4904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7235, loss: 0.5438, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||:  82%|########2 | 78/95 [00:36<00:08,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9637, LAS: 0.9311, UEM: 0.6769, LEM: 0.4616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3138, partial_loss/deprel_loss: 0.3029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4951, loss: 0.5419, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||:  87%|########7 | 83/95 [00:39<00:05,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9642, LAS: 0.9316, UEM: 0.6870, LEM: 0.4712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1842, partial_loss/deprel_loss: 0.3372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4966, loss: 0.5379, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||:  93%|#########2| 88/95 [00:41<00:03,  2.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9635, LAS: 0.9308, UEM: 0.6806, LEM: 0.4640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1564, partial_loss/deprel_loss: 0.2680, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4357, loss: 0.5434, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||:  98%|#########7| 93/95 [00:44<00:00,  2.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9633, LAS: 0.9307, UEM: 0.6768, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4608, partial_loss/deprel_loss: 0.3600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5702, loss: 0.5447, batch_reg_loss: 0.1900, reg_loss: 0.1901 ||: 100%|##########| 95/95 [00:45<00:00,  2.10it/s]\n",
+      "2023-04-07 02:01:08,477 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9448, LAS: 0.8860, UEM: 0.5352, LEM: 0.1796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5433, partial_loss/deprel_loss: 7.2230, partial_loss/cycle_loss: 0.0000, batch_loss: 5.8870, loss: 6.9931, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  36%|###6      | 4/11 [00:02<00:04,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9505, LAS: 0.8974, UEM: 0.6350, LEM: 0.3188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4079, partial_loss/deprel_loss: 6.9281, partial_loss/cycle_loss: 0.0000, batch_loss: 5.6240, loss: 7.0933, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:04<00:02,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8590, UAS: 0.9515, LAS: 0.9005, UEM: 0.7005, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5050, partial_loss/deprel_loss: 16.8045, partial_loss/cycle_loss: 0.0000, batch_loss: 13.7446, loss: 7.1973, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:06<00:00,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9514, LAS: 0.8998, UEM: 0.6857, LEM: 0.4084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9330, partial_loss/deprel_loss: 9.0223, partial_loss/cycle_loss: 0.0000, batch_loss: 7.4045, loss: 7.2161, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00,  1.47it/s]  \n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.190  |     0.000\n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - UEM                      |     0.677  |     0.686\n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - LEM                      |     0.461  |     0.408\n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - EM                       |     0.929  |     0.893\n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.461  |     0.933\n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 02:01:15,990 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |     0.951\n",
+      "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.360  |     9.022\n",
+      "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - loss                     |     0.545  |     7.216\n",
+      "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |     0.900\n",
+      "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:01:15,991 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 02:01:15,996 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:01:20,786 - INFO - combo.training.trainer - Epoch duration: 0:01:00.683444\n",
+      "2023-04-07 02:01:20,786 - INFO - combo.training.trainer - Estimated training time remaining: 4:30:17\n",
+      "2023-04-07 02:01:20,786 - INFO - allennlp.training.trainer - Epoch 166/399\n",
+      "2023-04-07 02:01:20,787 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:01:20,787 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:01:20,797 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9630, LAS: 0.9317, UEM: 0.5782, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2255, partial_loss/deprel_loss: 0.3330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5015, loss: 0.5402, batch_reg_loss: 0.1900, reg_loss: 0.1900 ||:   5%|5         | 5/95 [00:02<00:39,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9617, LAS: 0.9299, UEM: 0.5833, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6250, partial_loss/deprel_loss: 0.4584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6817, loss: 0.5524, batch_reg_loss: 0.1900, reg_loss: 0.1900 ||:  11%|#         | 10/95 [00:04<00:38,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9524, UAS: 0.9609, LAS: 0.9288, UEM: 0.6356, LEM: 0.4083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1701, partial_loss/deprel_loss: 0.2190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3992, loss: 0.5518, batch_reg_loss: 0.1900, reg_loss: 0.1900 ||:  16%|#5        | 15/95 [00:07<00:37,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9625, LAS: 0.9310, UEM: 0.6482, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6380, loss: 0.5423, batch_reg_loss: 0.1900, reg_loss: 0.1900 ||:  21%|##1       | 20/95 [00:09<00:35,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9658, LAS: 0.9344, UEM: 0.7192, LEM: 0.5075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1990, partial_loss/deprel_loss: 0.2955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4662, loss: 0.5199, batch_reg_loss: 0.1900, reg_loss: 0.1900 ||:  25%|##5       | 24/95 [00:11<00:33,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9667, LAS: 0.9357, UEM: 0.7434, LEM: 0.5478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0250, partial_loss/deprel_loss: 0.0946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2706, loss: 0.5135, batch_reg_loss: 0.1899, reg_loss: 0.1900 ||:  29%|##9       | 28/95 [00:13<00:32,  2.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9642, LAS: 0.9332, UEM: 0.7205, LEM: 0.5279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2251, partial_loss/deprel_loss: 0.3153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4872, loss: 0.5324, batch_reg_loss: 0.1899, reg_loss: 0.1900 ||:  35%|###4      | 33/95 [00:16<00:30,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9642, LAS: 0.9329, UEM: 0.7150, LEM: 0.5171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5854, partial_loss/deprel_loss: 0.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6486, loss: 0.5328, batch_reg_loss: 0.1899, reg_loss: 0.1900 ||:  40%|####      | 38/95 [00:18<00:27,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9655, LAS: 0.9340, UEM: 0.7234, LEM: 0.5171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0865, partial_loss/deprel_loss: 0.2346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3949, loss: 0.5269, batch_reg_loss: 0.1899, reg_loss: 0.1900 ||:  45%|####5     | 43/95 [00:20<00:24,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9656, LAS: 0.9338, UEM: 0.7135, LEM: 0.5010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3880, partial_loss/deprel_loss: 0.3729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5658, loss: 0.5266, batch_reg_loss: 0.1899, reg_loss: 0.1900 ||:  51%|#####     | 48/95 [00:23<00:22,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9524, UAS: 0.9664, LAS: 0.9343, UEM: 0.7228, LEM: 0.5068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0947, partial_loss/deprel_loss: 0.2209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3855, loss: 0.5215, batch_reg_loss: 0.1899, reg_loss: 0.1899 ||:  56%|#####5    | 53/95 [00:25<00:20,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9662, LAS: 0.9339, UEM: 0.7176, LEM: 0.5030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3663, partial_loss/deprel_loss: 0.4278, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6054, loss: 0.5242, batch_reg_loss: 0.1899, reg_loss: 0.1899 ||:  61%|######1   | 58/95 [00:27<00:17,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9368, UAS: 0.9666, LAS: 0.9343, UEM: 0.7131, LEM: 0.4957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2723, partial_loss/deprel_loss: 0.3498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5242, loss: 0.5230, batch_reg_loss: 0.1899, reg_loss: 0.1899 ||:  66%|######6   | 63/95 [00:30<00:15,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9655, LAS: 0.9330, UEM: 0.7009, LEM: 0.4835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3474, partial_loss/deprel_loss: 0.3285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5221, loss: 0.5304, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||:  72%|#######1  | 68/95 [00:32<00:12,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9650, LAS: 0.9325, UEM: 0.6981, LEM: 0.4813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4814, partial_loss/deprel_loss: 0.4150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6181, loss: 0.5332, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||:  77%|#######6  | 73/95 [00:35<00:10,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9649, LAS: 0.9324, UEM: 0.6913, LEM: 0.4740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4917, partial_loss/deprel_loss: 0.4035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.5346, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||:  82%|########2 | 78/95 [00:37<00:08,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9652, LAS: 0.9326, UEM: 0.6916, LEM: 0.4719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2079, partial_loss/deprel_loss: 0.3110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4802, loss: 0.5338, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||:  87%|########7 | 83/95 [00:39<00:05,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9649, LAS: 0.9321, UEM: 0.6894, LEM: 0.4701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4565, partial_loss/deprel_loss: 0.4445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6367, loss: 0.5362, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||:  93%|#########2| 88/95 [00:42<00:03,  2.12it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9646, LAS: 0.9318, UEM: 0.6823, LEM: 0.4627, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7761, partial_loss/deprel_loss: 0.4415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6982, loss: 0.5384, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||:  98%|#########7| 93/95 [00:44<00:00,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9643, LAS: 0.9315, UEM: 0.6814, LEM: 0.4626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2074, partial_loss/deprel_loss: 0.2274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4132, loss: 0.5408, batch_reg_loss: 0.1898, reg_loss: 0.1899 ||: 100%|##########| 95/95 [00:45<00:00,  2.10it/s]\n",
+      "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.190  |       N/A\n",
+      "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - UEM                      |     0.681  |       N/A\n",
+      "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - LEM                      |     0.463  |       N/A\n",
+      "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - EM                       |     0.945  |       N/A\n",
+      "2023-04-07 02:02:09,280 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.207  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - UAS                      |     0.964  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.227  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - loss                     |     0.541  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - LAS                      |     0.932  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:02:09,281 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:02:09,286 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:02:14,100 - INFO - combo.training.trainer - Epoch duration: 0:00:53.313553\n",
+      "2023-04-07 02:02:14,100 - INFO - combo.training.trainer - Estimated training time remaining: 4:28:45\n",
+      "2023-04-07 02:02:14,101 - INFO - allennlp.training.trainer - Epoch 167/399\n",
+      "2023-04-07 02:02:14,101 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:02:14,102 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:02:14,110 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9506, UAS: 0.9654, LAS: 0.9332, UEM: 0.6255, LEM: 0.4033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1278, partial_loss/deprel_loss: 0.2510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4161, loss: 0.5278, batch_reg_loss: 0.1898, reg_loss: 0.1898 ||:   5%|5         | 5/95 [00:02<00:43,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8819, UAS: 0.9584, LAS: 0.9268, UEM: 0.6078, LEM: 0.3995, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1507, partial_loss/deprel_loss: 0.6453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9362, loss: 0.5770, batch_reg_loss: 0.1898, reg_loss: 0.1898 ||:   9%|9         | 9/95 [00:04<00:42,  2.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9615, LAS: 0.9300, UEM: 0.6402, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1392, partial_loss/deprel_loss: 0.2267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3990, loss: 0.5564, batch_reg_loss: 0.1898, reg_loss: 0.1898 ||:  14%|#3        | 13/95 [00:06<00:40,  2.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9644, LAS: 0.9332, UEM: 0.6783, LEM: 0.4616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2646, partial_loss/deprel_loss: 0.3075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4887, loss: 0.5265, batch_reg_loss: 0.1898, reg_loss: 0.1898 ||:  19%|#8        | 18/95 [00:08<00:37,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9633, LAS: 0.9322, UEM: 0.6436, LEM: 0.4276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2725, partial_loss/deprel_loss: 0.2990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4835, loss: 0.5361, batch_reg_loss: 0.1897, reg_loss: 0.1898 ||:  24%|##4       | 23/95 [00:11<00:34,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9625, LAS: 0.9311, UEM: 0.6389, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1966, partial_loss/deprel_loss: 0.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.5427, batch_reg_loss: 0.1897, reg_loss: 0.1898 ||:  29%|##9       | 28/95 [00:13<00:32,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9623, LAS: 0.9310, UEM: 0.6383, LEM: 0.4220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8791, partial_loss/deprel_loss: 0.5183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7802, loss: 0.5432, batch_reg_loss: 0.1897, reg_loss: 0.1898 ||:  35%|###4      | 33/95 [00:16<00:29,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9624, LAS: 0.9309, UEM: 0.6327, LEM: 0.4129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1652, partial_loss/deprel_loss: 0.3114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4718, loss: 0.5450, batch_reg_loss: 0.1897, reg_loss: 0.1898 ||:  40%|####      | 38/95 [00:18<00:26,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9632, LAS: 0.9319, UEM: 0.6344, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2448, partial_loss/deprel_loss: 0.2695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4543, loss: 0.5403, batch_reg_loss: 0.1897, reg_loss: 0.1897 ||:  45%|####5     | 43/95 [00:20<00:24,  2.16it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9639, LAS: 0.9326, UEM: 0.6478, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5301, partial_loss/deprel_loss: 0.4553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.5358, batch_reg_loss: 0.1897, reg_loss: 0.1897 ||:  51%|#####     | 48/95 [00:22<00:22,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9643, LAS: 0.9329, UEM: 0.6518, LEM: 0.4286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4277, partial_loss/deprel_loss: 0.4355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6236, loss: 0.5326, batch_reg_loss: 0.1896, reg_loss: 0.1897 ||:  56%|#####5    | 53/95 [00:25<00:19,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9332, UAS: 0.9645, LAS: 0.9330, UEM: 0.6463, LEM: 0.4197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3142, partial_loss/deprel_loss: 0.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5341, loss: 0.5324, batch_reg_loss: 0.1896, reg_loss: 0.1897 ||:  61%|######1   | 58/95 [00:27<00:17,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9648, LAS: 0.9333, UEM: 0.6506, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2682, partial_loss/deprel_loss: 0.3169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4968, loss: 0.5293, batch_reg_loss: 0.1896, reg_loss: 0.1897 ||:  66%|######6   | 63/95 [00:29<00:14,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9653, LAS: 0.9337, UEM: 0.6653, LEM: 0.4415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3111, partial_loss/deprel_loss: 0.3504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5321, loss: 0.5264, batch_reg_loss: 0.1896, reg_loss: 0.1897 ||:  72%|#######1  | 68/95 [00:32<00:12,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9649, LAS: 0.9334, UEM: 0.6681, LEM: 0.4497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2896, partial_loss/deprel_loss: 0.2878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4777, loss: 0.5303, batch_reg_loss: 0.1896, reg_loss: 0.1897 ||:  77%|#######6  | 73/95 [00:34<00:10,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9654, LAS: 0.9338, UEM: 0.6709, LEM: 0.4501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2031, partial_loss/deprel_loss: 0.2615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4394, loss: 0.5279, batch_reg_loss: 0.1896, reg_loss: 0.1897 ||:  82%|########2 | 78/95 [00:36<00:07,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9736, UAS: 0.9662, LAS: 0.9346, UEM: 0.6955, LEM: 0.4819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0278, partial_loss/deprel_loss: 0.1079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2814, loss: 0.5208, batch_reg_loss: 0.1895, reg_loss: 0.1897 ||:  87%|########7 | 83/95 [00:39<00:06,  1.97it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9661, LAS: 0.9344, UEM: 0.6960, LEM: 0.4822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1564, partial_loss/deprel_loss: 0.2694, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4363, loss: 0.5217, batch_reg_loss: 0.1895, reg_loss: 0.1897 ||:  92%|#########1| 87/95 [00:41<00:04,  1.98it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9657, LAS: 0.9341, UEM: 0.6945, LEM: 0.4807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1499, partial_loss/deprel_loss: 0.2363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4085, loss: 0.5231, batch_reg_loss: 0.1895, reg_loss: 0.1897 ||:  97%|#########6| 92/95 [00:44<00:01,  2.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9651, LAS: 0.9334, UEM: 0.6874, LEM: 0.4750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6916, partial_loss/deprel_loss: 0.4745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7074, loss: 0.5286, batch_reg_loss: 0.1895, reg_loss: 0.1897 ||: 100%|##########| 95/95 [00:45<00:00,  2.07it/s]\n",
+      "2023-04-07 02:03:02,709 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.190  |       N/A\n",
+      "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - UEM                      |     0.687  |       N/A\n",
+      "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - LEM                      |     0.475  |       N/A\n",
+      "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - EM                       |     0.908  |       N/A\n",
+      "2023-04-07 02:03:02,711 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.692  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - UAS                      |     0.965  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.474  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - loss                     |     0.529  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - LAS                      |     0.933  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:03:02,712 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:03:02,717 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:03:07,245 - INFO - combo.training.trainer - Epoch duration: 0:00:53.144077\n",
+      "2023-04-07 02:03:07,245 - INFO - combo.training.trainer - Estimated training time remaining: 4:27:14\n",
+      "2023-04-07 02:03:07,246 - INFO - allennlp.training.trainer - Epoch 168/399\n",
+      "2023-04-07 02:03:07,246 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:03:07,247 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:03:07,257 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9666, LAS: 0.9362, UEM: 0.6196, LEM: 0.3873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2618, partial_loss/deprel_loss: 0.2921, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4755, loss: 0.5008, batch_reg_loss: 0.1895, reg_loss: 0.1895 ||:   5%|5         | 5/95 [00:02<00:38,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9671, LAS: 0.9346, UEM: 0.6740, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5996, partial_loss/deprel_loss: 0.4462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6664, loss: 0.5037, batch_reg_loss: 0.1895, reg_loss: 0.1895 ||:   9%|9         | 9/95 [00:04<00:39,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9649, LAS: 0.9325, UEM: 0.6628, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3849, partial_loss/deprel_loss: 0.3403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5386, loss: 0.5212, batch_reg_loss: 0.1894, reg_loss: 0.1895 ||:  15%|#4        | 14/95 [00:06<00:36,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9664, LAS: 0.9347, UEM: 0.6997, LEM: 0.4825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4664, partial_loss/deprel_loss: 0.4039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6058, loss: 0.5104, batch_reg_loss: 0.1894, reg_loss: 0.1895 ||:  20%|##        | 19/95 [00:08<00:34,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9641, LAS: 0.9330, UEM: 0.6694, LEM: 0.4525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3107, partial_loss/deprel_loss: 0.3015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4927, loss: 0.5253, batch_reg_loss: 0.1894, reg_loss: 0.1894 ||:  25%|##5       | 24/95 [00:11<00:32,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9620, LAS: 0.9311, UEM: 0.6397, LEM: 0.4237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8955, partial_loss/deprel_loss: 0.4527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7307, loss: 0.5400, batch_reg_loss: 0.1894, reg_loss: 0.1894 ||:  31%|###       | 29/95 [00:13<00:30,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9614, LAS: 0.9305, UEM: 0.6237, LEM: 0.4095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2517, partial_loss/deprel_loss: 0.3106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4882, loss: 0.5452, batch_reg_loss: 0.1894, reg_loss: 0.1894 ||:  36%|###5      | 34/95 [00:15<00:27,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9617, LAS: 0.9309, UEM: 0.6249, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1641, partial_loss/deprel_loss: 0.2673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4361, loss: 0.5443, batch_reg_loss: 0.1894, reg_loss: 0.1894 ||:  41%|####1     | 39/95 [00:18<00:26,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9625, LAS: 0.9318, UEM: 0.6325, LEM: 0.4153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3411, partial_loss/deprel_loss: 0.3364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.5372, batch_reg_loss: 0.1893, reg_loss: 0.1894 ||:  46%|####6     | 44/95 [00:20<00:24,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9629, LAS: 0.9323, UEM: 0.6364, LEM: 0.4190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1839, partial_loss/deprel_loss: 0.2767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4475, loss: 0.5370, batch_reg_loss: 0.1893, reg_loss: 0.1894 ||:  52%|#####1    | 49/95 [00:22<00:21,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9635, LAS: 0.9327, UEM: 0.6392, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1691, partial_loss/deprel_loss: 0.3004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4635, loss: 0.5335, batch_reg_loss: 0.1893, reg_loss: 0.1894 ||:  57%|#####6    | 54/95 [00:25<00:19,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9640, LAS: 0.9330, UEM: 0.6387, LEM: 0.4136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2968, partial_loss/deprel_loss: 0.3182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5032, loss: 0.5312, batch_reg_loss: 0.1893, reg_loss: 0.1894 ||:  62%|######2   | 59/95 [00:27<00:16,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9639, LAS: 0.9332, UEM: 0.6360, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2409, partial_loss/deprel_loss: 0.2927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4716, loss: 0.5308, batch_reg_loss: 0.1893, reg_loss: 0.1894 ||:  67%|######7   | 64/95 [00:29<00:14,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9528, UAS: 0.9645, LAS: 0.9338, UEM: 0.6452, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1767, partial_loss/deprel_loss: 0.2089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3917, loss: 0.5265, batch_reg_loss: 0.1893, reg_loss: 0.1894 ||:  73%|#######2  | 69/95 [00:32<00:12,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9644, LAS: 0.9336, UEM: 0.6536, LEM: 0.4298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2759, partial_loss/deprel_loss: 0.3663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5375, loss: 0.5278, batch_reg_loss: 0.1892, reg_loss: 0.1894 ||:  78%|#######7  | 74/95 [00:34<00:10,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9649, LAS: 0.9342, UEM: 0.6632, LEM: 0.4390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4438, partial_loss/deprel_loss: 0.4065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6031, loss: 0.5240, batch_reg_loss: 0.1892, reg_loss: 0.1894 ||:  83%|########3 | 79/95 [00:37<00:07,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9657, LAS: 0.9351, UEM: 0.6920, LEM: 0.4787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0267, partial_loss/deprel_loss: 0.1064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2796, loss: 0.5168, batch_reg_loss: 0.1892, reg_loss: 0.1893 ||:  88%|########8 | 84/95 [00:40<00:05,  1.98it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9653, LAS: 0.9348, UEM: 0.6902, LEM: 0.4779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2619, partial_loss/deprel_loss: 0.2646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4532, loss: 0.5183, batch_reg_loss: 0.1892, reg_loss: 0.1893 ||:  94%|#########3| 89/95 [00:42<00:03,  1.99it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9431, UAS: 0.9653, LAS: 0.9347, UEM: 0.6901, LEM: 0.4773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1948, partial_loss/deprel_loss: 0.2738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4471, loss: 0.5187, batch_reg_loss: 0.1891, reg_loss: 0.1893 ||:  99%|#########8| 94/95 [00:45<00:00,  2.00it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9652, LAS: 0.9346, UEM: 0.6877, LEM: 0.4753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4584, partial_loss/deprel_loss: 0.3815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5860, loss: 0.5194, batch_reg_loss: 0.1891, reg_loss: 0.1893 ||: 100%|##########| 95/95 [00:45<00:00,  2.09it/s]\n",
+      "2023-04-07 02:03:55,866 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.189  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - UEM                      |     0.688  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - LEM                      |     0.475  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - EM                       |     0.931  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.458  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - UAS                      |     0.965  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.381  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - loss                     |     0.519  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:03:55,867 - INFO - combo.training.tensorboard_writer - LAS                      |     0.935  |       N/A\n",
+      "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:03:55,868 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:03:55,873 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:04:00,656 - INFO - combo.training.trainer - Epoch duration: 0:00:53.410501\n",
+      "2023-04-07 02:04:00,657 - INFO - combo.training.trainer - Estimated training time remaining: 4:25:43\n",
+      "2023-04-07 02:04:00,657 - INFO - allennlp.training.trainer - Epoch 169/399\n",
+      "2023-04-07 02:04:00,657 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:04:00,658 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:04:00,667 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9431, UAS: 0.9698, LAS: 0.9411, UEM: 0.6418, LEM: 0.4026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2413, partial_loss/deprel_loss: 0.2945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4730, loss: 0.4935, batch_reg_loss: 0.1891, reg_loss: 0.1891 ||:   5%|5         | 5/95 [00:02<00:38,  2.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9726, LAS: 0.9440, UEM: 0.7260, LEM: 0.5097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2509, partial_loss/deprel_loss: 0.2617, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4487, loss: 0.4653, batch_reg_loss: 0.1891, reg_loss: 0.1891 ||:  11%|#         | 10/95 [00:04<00:37,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9677, LAS: 0.9380, UEM: 0.6683, LEM: 0.4510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5019, partial_loss/deprel_loss: 0.3501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5695, loss: 0.4984, batch_reg_loss: 0.1891, reg_loss: 0.1891 ||:  16%|#5        | 15/95 [00:06<00:36,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9693, LAS: 0.9395, UEM: 0.6868, LEM: 0.4654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1516, partial_loss/deprel_loss: 0.2564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4245, loss: 0.4872, batch_reg_loss: 0.1891, reg_loss: 0.1891 ||:  21%|##1       | 20/95 [00:09<00:34,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9518, UAS: 0.9687, LAS: 0.9386, UEM: 0.6907, LEM: 0.4665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1540, partial_loss/deprel_loss: 0.2328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4061, loss: 0.4929, batch_reg_loss: 0.1890, reg_loss: 0.1891 ||:  26%|##6       | 25/95 [00:11<00:32,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9673, LAS: 0.9369, UEM: 0.6747, LEM: 0.4506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6361, partial_loss/deprel_loss: 0.4534, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6790, loss: 0.5034, batch_reg_loss: 0.1890, reg_loss: 0.1891 ||:  32%|###1      | 30/95 [00:13<00:29,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9654, LAS: 0.9351, UEM: 0.6693, LEM: 0.4517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1109, partial_loss/deprel_loss: 0.2039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3743, loss: 0.5151, batch_reg_loss: 0.1890, reg_loss: 0.1891 ||:  36%|###5      | 34/95 [00:15<00:28,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9640, LAS: 0.9335, UEM: 0.6648, LEM: 0.4455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.3067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4816, loss: 0.5248, batch_reg_loss: 0.1890, reg_loss: 0.1891 ||:  40%|####      | 38/95 [00:18<00:27,  2.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9504, UAS: 0.9643, LAS: 0.9338, UEM: 0.6627, LEM: 0.4412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1614, partial_loss/deprel_loss: 0.2306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4058, loss: 0.5239, batch_reg_loss: 0.1890, reg_loss: 0.1891 ||:  45%|####5     | 43/95 [00:20<00:24,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9639, LAS: 0.9334, UEM: 0.6678, LEM: 0.4480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4158, partial_loss/deprel_loss: 0.3459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5489, loss: 0.5280, batch_reg_loss: 0.1890, reg_loss: 0.1890 ||:  51%|#####     | 48/95 [00:22<00:23,  2.04it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9648, LAS: 0.9342, UEM: 0.6731, LEM: 0.4501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1368, partial_loss/deprel_loss: 0.2578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4226, loss: 0.5226, batch_reg_loss: 0.1890, reg_loss: 0.1890 ||:  56%|#####5    | 53/95 [00:25<00:19,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9652, LAS: 0.9346, UEM: 0.6799, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3672, partial_loss/deprel_loss: 0.4244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6019, loss: 0.5194, batch_reg_loss: 0.1889, reg_loss: 0.1890 ||:  61%|######1   | 58/95 [00:27<00:17,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9662, LAS: 0.9354, UEM: 0.6912, LEM: 0.4639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1551, partial_loss/deprel_loss: 0.2573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4258, loss: 0.5132, batch_reg_loss: 0.1889, reg_loss: 0.1890 ||:  66%|######6   | 63/95 [00:29<00:15,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9664, LAS: 0.9359, UEM: 0.7032, LEM: 0.4875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1846, partial_loss/deprel_loss: 0.2637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4368, loss: 0.5111, batch_reg_loss: 0.1889, reg_loss: 0.1890 ||:  72%|#######1  | 68/95 [00:32<00:13,  2.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9659, LAS: 0.9357, UEM: 0.6989, LEM: 0.4847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1499, partial_loss/deprel_loss: 0.2348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4067, loss: 0.5120, batch_reg_loss: 0.1889, reg_loss: 0.1890 ||:  77%|#######6  | 73/95 [00:35<00:10,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9461, UAS: 0.9665, LAS: 0.9364, UEM: 0.7073, LEM: 0.4957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2139, partial_loss/deprel_loss: 0.2823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4574, loss: 0.5077, batch_reg_loss: 0.1889, reg_loss: 0.1890 ||:  82%|########2 | 78/95 [00:37<00:08,  2.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9665, LAS: 0.9363, UEM: 0.7041, LEM: 0.4912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4997, partial_loss/deprel_loss: 0.3876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5988, loss: 0.5086, batch_reg_loss: 0.1888, reg_loss: 0.1890 ||:  87%|########7 | 83/95 [00:39<00:05,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9661, LAS: 0.9360, UEM: 0.6966, LEM: 0.4835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5800, partial_loss/deprel_loss: 0.3905, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6172, loss: 0.5121, batch_reg_loss: 0.1888, reg_loss: 0.1890 ||:  93%|#########2| 88/95 [00:42<00:03,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9664, LAS: 0.9362, UEM: 0.6986, LEM: 0.4822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3492, partial_loss/deprel_loss: 0.4149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5906, loss: 0.5113, batch_reg_loss: 0.1888, reg_loss: 0.1890 ||:  98%|#########7| 93/95 [00:44<00:00,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9663, LAS: 0.9362, UEM: 0.6948, LEM: 0.4785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3264, partial_loss/deprel_loss: 0.3409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5268, loss: 0.5126, batch_reg_loss: 0.1888, reg_loss: 0.1890 ||: 100%|##########| 95/95 [00:45<00:00,  2.09it/s]\n",
+      "2023-04-07 02:04:48,869 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:04:48,869 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 02:04:48,869 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.189  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - UEM                      |     0.695  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - LEM                      |     0.479  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - EM                       |     0.942  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.326  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - UAS                      |     0.966  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.341  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - loss                     |     0.513  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - LAS                      |     0.936  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:04:48,870 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:04:48,871 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:04:48,871 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:04:48,871 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:04:48,874 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:04:52,934 - INFO - combo.training.trainer - Epoch duration: 0:00:52.276559\n",
+      "2023-04-07 02:04:52,934 - INFO - combo.training.trainer - Estimated training time remaining: 4:24:12\n",
+      "2023-04-07 02:04:52,934 - INFO - allennlp.training.trainer - Epoch 170/399\n",
+      "2023-04-07 02:04:52,934 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:04:52,935 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:04:52,943 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9684, LAS: 0.9376, UEM: 0.6909, LEM: 0.4470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4841, partial_loss/deprel_loss: 0.4147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6174, loss: 0.5100, batch_reg_loss: 0.1888, reg_loss: 0.1888 ||:   5%|5         | 5/95 [00:02<00:39,  2.29it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9687, LAS: 0.9387, UEM: 0.6775, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2149, partial_loss/deprel_loss: 0.2755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4521, loss: 0.4978, batch_reg_loss: 0.1888, reg_loss: 0.1888 ||:  11%|#         | 10/95 [00:04<00:36,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9715, LAS: 0.9419, UEM: 0.7333, LEM: 0.5131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1959, partial_loss/deprel_loss: 0.2153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4001, loss: 0.4725, batch_reg_loss: 0.1887, reg_loss: 0.1888 ||:  16%|#5        | 15/95 [00:06<00:34,  2.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9721, LAS: 0.9428, UEM: 0.7274, LEM: 0.5008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.3201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5026, loss: 0.4681, batch_reg_loss: 0.1887, reg_loss: 0.1888 ||:  21%|##1       | 20/95 [00:08<00:32,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9698, LAS: 0.9406, UEM: 0.7019, LEM: 0.4749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2561, partial_loss/deprel_loss: 0.2651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4520, loss: 0.4841, batch_reg_loss: 0.1887, reg_loss: 0.1888 ||:  26%|##6       | 25/95 [00:10<00:30,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9662, LAS: 0.9372, UEM: 0.6700, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6342, partial_loss/deprel_loss: 0.4175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6495, loss: 0.5039, batch_reg_loss: 0.1887, reg_loss: 0.1887 ||:  32%|###1      | 30/95 [00:13<00:28,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9666, LAS: 0.9376, UEM: 0.6813, LEM: 0.4667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1756, partial_loss/deprel_loss: 0.2992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4631, loss: 0.5028, batch_reg_loss: 0.1887, reg_loss: 0.1887 ||:  37%|###6      | 35/95 [00:15<00:27,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9670, LAS: 0.9382, UEM: 0.6947, LEM: 0.4845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4920, partial_loss/deprel_loss: 0.3329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5534, loss: 0.4973, batch_reg_loss: 0.1887, reg_loss: 0.1887 ||:  42%|####2     | 40/95 [00:17<00:24,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9678, LAS: 0.9391, UEM: 0.7201, LEM: 0.5218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7146, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6697, loss: 0.4923, batch_reg_loss: 0.1886, reg_loss: 0.1887 ||:  47%|####7     | 45/95 [00:20<00:23,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9299, UAS: 0.9673, LAS: 0.9385, UEM: 0.7101, LEM: 0.5084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4554, partial_loss/deprel_loss: 0.3643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5711, loss: 0.4978, batch_reg_loss: 0.1886, reg_loss: 0.1887 ||:  53%|#####2    | 50/95 [00:22<00:21,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9675, LAS: 0.9387, UEM: 0.7079, LEM: 0.5057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0977, partial_loss/deprel_loss: 0.2086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3750, loss: 0.4944, batch_reg_loss: 0.1886, reg_loss: 0.1887 ||:  58%|#####7    | 55/95 [00:25<00:19,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9660, LAS: 0.9371, UEM: 0.6921, LEM: 0.4913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0203, partial_loss/deprel_loss: 0.4821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7783, loss: 0.5049, batch_reg_loss: 0.1886, reg_loss: 0.1887 ||:  63%|######3   | 60/95 [00:27<00:16,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9272, UAS: 0.9658, LAS: 0.9369, UEM: 0.6886, LEM: 0.4873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5424, partial_loss/deprel_loss: 0.4279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6394, loss: 0.5069, batch_reg_loss: 0.1886, reg_loss: 0.1887 ||:  68%|######8   | 65/95 [00:30<00:14,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9658, LAS: 0.9368, UEM: 0.6917, LEM: 0.4884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1012, partial_loss/deprel_loss: 0.2260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3896, loss: 0.5079, batch_reg_loss: 0.1885, reg_loss: 0.1887 ||:  74%|#######3  | 70/95 [00:32<00:12,  2.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9659, LAS: 0.9369, UEM: 0.6901, LEM: 0.4871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3690, partial_loss/deprel_loss: 0.3551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5464, loss: 0.5082, batch_reg_loss: 0.1885, reg_loss: 0.1887 ||:  78%|#######7  | 74/95 [00:34<00:10,  1.99it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9661, LAS: 0.9371, UEM: 0.6906, LEM: 0.4851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.3031, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4746, loss: 0.5066, batch_reg_loss: 0.1885, reg_loss: 0.1886 ||:  83%|########3 | 79/95 [00:37<00:08,  1.99it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9666, LAS: 0.9375, UEM: 0.6934, LEM: 0.4857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1515, partial_loss/deprel_loss: 0.2274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4007, loss: 0.5043, batch_reg_loss: 0.1885, reg_loss: 0.1886 ||:  88%|########8 | 84/95 [00:39<00:05,  2.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9668, LAS: 0.9376, UEM: 0.6980, LEM: 0.4908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3548, partial_loss/deprel_loss: 0.3839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5666, loss: 0.5031, batch_reg_loss: 0.1885, reg_loss: 0.1886 ||:  94%|#########3| 89/95 [00:42<00:02,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9665, LAS: 0.9373, UEM: 0.6975, LEM: 0.4906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.3297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5044, loss: 0.5043, batch_reg_loss: 0.1885, reg_loss: 0.1886 ||:  99%|#########8| 94/95 [00:44<00:00,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9665, LAS: 0.9373, UEM: 0.6966, LEM: 0.4894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3578, partial_loss/deprel_loss: 0.3210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5168, loss: 0.5045, batch_reg_loss: 0.1885, reg_loss: 0.1886 ||: 100%|##########| 95/95 [00:45<00:00,  2.11it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:05:41,112 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9606, LAS: 0.9147, UEM: 0.8017, LEM: 0.5895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2081, partial_loss/deprel_loss: 4.6841, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7889, loss: 6.6149, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:05,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9545, LAS: 0.9051, UEM: 0.7521, LEM: 0.4908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5775, partial_loss/deprel_loss: 16.9584, partial_loss/cycle_loss: 0.0000, batch_loss: 13.8822, loss: 7.3829, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  55%|#####4    | 6/11 [00:04<00:03,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9544, LAS: 0.9039, UEM: 0.7156, LEM: 0.4422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2515, partial_loss/deprel_loss: 14.2445, partial_loss/cycle_loss: 0.0000, batch_loss: 11.6459, loss: 7.2721, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  91%|######### | 10/11 [00:06<00:00,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9524, LAS: 0.9017, UEM: 0.6955, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0646, partial_loss/deprel_loss: 8.0247, partial_loss/cycle_loss: 0.0000, batch_loss: 6.6326, loss: 7.2140, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00,  1.49it/s]  \n",
+      "2023-04-07 02:05:48,501 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.189  |     0.000\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - UEM                      |     0.697  |     0.695\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - LEM                      |     0.489  |     0.424\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - EM                       |     0.936  |     0.880\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.358  |     1.065\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - UAS                      |     0.966  |     0.952\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.321  |     8.025\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - loss                     |     0.504  |     7.214\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - LAS                      |     0.937  |     0.902\n",
+      "2023-04-07 02:05:48,502 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 02:05:48,503 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:05:48,503 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:05:48,503 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:05:48,503 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:05:48,503 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 02:05:48,508 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:05:53,326 - INFO - combo.training.trainer - Epoch duration: 0:01:00.392223\n",
+      "2023-04-07 02:05:53,327 - INFO - combo.training.trainer - Estimated training time remaining: 4:22:51\n",
+      "2023-04-07 02:05:53,327 - INFO - allennlp.training.trainer - Epoch 171/399\n",
+      "2023-04-07 02:05:53,328 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:05:53,328 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:05:53,338 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9800, UAS: 0.9725, LAS: 0.9501, UEM: 0.9113, LEM: 0.8424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0207, partial_loss/deprel_loss: 0.0859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2613, loss: 0.4325, batch_reg_loss: 0.1884, reg_loss: 0.1884 ||:   2%|2         | 2/95 [00:03<02:36,  1.68s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9683, LAS: 0.9401, UEM: 0.8034, LEM: 0.6626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1351, partial_loss/deprel_loss: 0.2525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4174, loss: 0.4835, batch_reg_loss: 0.1884, reg_loss: 0.1884 ||:   7%|7         | 7/95 [00:05<01:55,  1.31s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9489, UAS: 0.9652, LAS: 0.9365, UEM: 0.7790, LEM: 0.6240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1633, partial_loss/deprel_loss: 0.2132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3916, loss: 0.4996, batch_reg_loss: 0.1884, reg_loss: 0.1884 ||:  12%|#1        | 11/95 [00:07<01:30,  1.08s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9678, LAS: 0.9386, UEM: 0.7664, LEM: 0.5865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1950, partial_loss/deprel_loss: 0.2914, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4605, loss: 0.4872, batch_reg_loss: 0.1884, reg_loss: 0.1884 ||:  17%|#6        | 16/95 [00:09<01:09,  1.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9520, UAS: 0.9692, LAS: 0.9398, UEM: 0.7505, LEM: 0.5586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1606, partial_loss/deprel_loss: 0.2313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4056, loss: 0.4809, batch_reg_loss: 0.1884, reg_loss: 0.1884 ||:  22%|##2       | 21/95 [00:12<00:56,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9704, LAS: 0.9406, UEM: 0.7493, LEM: 0.5435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1785, partial_loss/deprel_loss: 0.2603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4323, loss: 0.4747, batch_reg_loss: 0.1883, reg_loss: 0.1884 ||:  27%|##7       | 26/95 [00:14<00:45,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9569, UAS: 0.9703, LAS: 0.9406, UEM: 0.7494, LEM: 0.5445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1113, partial_loss/deprel_loss: 0.1922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3643, loss: 0.4752, batch_reg_loss: 0.1883, reg_loss: 0.1884 ||:  32%|###1      | 30/95 [00:16<00:40,  1.60it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9696, LAS: 0.9397, UEM: 0.7372, LEM: 0.5301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2091, partial_loss/deprel_loss: 0.2668, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4435, loss: 0.4816, batch_reg_loss: 0.1883, reg_loss: 0.1884 ||:  36%|###5      | 34/95 [00:18<00:36,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9700, LAS: 0.9400, UEM: 0.7325, LEM: 0.5208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3220, partial_loss/deprel_loss: 0.3393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5241, loss: 0.4803, batch_reg_loss: 0.1883, reg_loss: 0.1884 ||:  41%|####1     | 39/95 [00:21<00:30,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9699, LAS: 0.9401, UEM: 0.7327, LEM: 0.5236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3314, partial_loss/deprel_loss: 0.3686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5494, loss: 0.4811, batch_reg_loss: 0.1883, reg_loss: 0.1884 ||:  45%|####5     | 43/95 [00:23<00:28,  1.84it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9691, LAS: 0.9394, UEM: 0.7168, LEM: 0.5071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2708, partial_loss/deprel_loss: 0.3169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4960, loss: 0.4881, batch_reg_loss: 0.1882, reg_loss: 0.1883 ||:  51%|#####     | 48/95 [00:25<00:24,  1.91it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9593, UAS: 0.9694, LAS: 0.9400, UEM: 0.7222, LEM: 0.5151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0995, partial_loss/deprel_loss: 0.1760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3489, loss: 0.4851, batch_reg_loss: 0.1882, reg_loss: 0.1883 ||:  56%|#####5    | 53/95 [00:27<00:21,  1.95it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9689, LAS: 0.9395, UEM: 0.7107, LEM: 0.5024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2013, partial_loss/deprel_loss: 0.2850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4564, loss: 0.4883, batch_reg_loss: 0.1882, reg_loss: 0.1883 ||:  61%|######1   | 58/95 [00:30<00:18,  1.97it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9689, LAS: 0.9396, UEM: 0.7063, LEM: 0.4967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1335, partial_loss/deprel_loss: 0.2659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4276, loss: 0.4874, batch_reg_loss: 0.1882, reg_loss: 0.1883 ||:  66%|######6   | 63/95 [00:32<00:15,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9685, LAS: 0.9392, UEM: 0.7010, LEM: 0.4914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4787, partial_loss/deprel_loss: 0.4124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.4897, batch_reg_loss: 0.1882, reg_loss: 0.1883 ||:  72%|#######1  | 68/95 [00:35<00:13,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9300, UAS: 0.9688, LAS: 0.9393, UEM: 0.7078, LEM: 0.4975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4541, partial_loss/deprel_loss: 0.3486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5579, loss: 0.4890, batch_reg_loss: 0.1882, reg_loss: 0.1883 ||:  77%|#######6  | 73/95 [00:37<00:10,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9535, UAS: 0.9681, LAS: 0.9388, UEM: 0.6992, LEM: 0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2062, partial_loss/deprel_loss: 0.2743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4489, loss: 0.4939, batch_reg_loss: 0.1881, reg_loss: 0.1883 ||:  82%|########2 | 78/95 [00:39<00:07,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9276, UAS: 0.9680, LAS: 0.9386, UEM: 0.6943, LEM: 0.4816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5463, partial_loss/deprel_loss: 0.4094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6249, loss: 0.4966, batch_reg_loss: 0.1881, reg_loss: 0.1883 ||:  87%|########7 | 83/95 [00:41<00:05,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9679, LAS: 0.9386, UEM: 0.6982, LEM: 0.4858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3599, partial_loss/deprel_loss: 0.3570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5457, loss: 0.4961, batch_reg_loss: 0.1881, reg_loss: 0.1883 ||:  93%|#########2| 88/95 [00:44<00:03,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9669, LAS: 0.9376, UEM: 0.6929, LEM: 0.4818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1493, partial_loss/deprel_loss: 0.2456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4144, loss: 0.5021, batch_reg_loss: 0.1881, reg_loss: 0.1883 ||:  98%|#########7| 93/95 [00:46<00:00,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9612, UAS: 0.9671, LAS: 0.9378, UEM: 0.6992, LEM: 0.4909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0732, partial_loss/deprel_loss: 0.1482, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3213, loss: 0.5004, batch_reg_loss: 0.1881, reg_loss: 0.1883 ||: 100%|##########| 95/95 [00:47<00:00,  1.99it/s]\n",
+      "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.188  |       N/A\n",
+      "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - UEM                      |     0.699  |       N/A\n",
+      "2023-04-07 02:06:43,858 - INFO - combo.training.tensorboard_writer - LEM                      |     0.491  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - EM                       |     0.961  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.073  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - UAS                      |     0.967  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.148  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - loss                     |     0.500  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - LAS                      |     0.938  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:06:43,859 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:06:43,864 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:06:48,563 - INFO - combo.training.trainer - Epoch duration: 0:00:55.235260\n",
+      "2023-04-07 02:06:48,563 - INFO - combo.training.trainer - Estimated training time remaining: 4:21:24\n",
+      "2023-04-07 02:06:48,563 - INFO - allennlp.training.trainer - Epoch 172/399\n",
+      "2023-04-07 02:06:48,564 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:06:48,564 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:06:48,574 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9654, LAS: 0.9351, UEM: 0.6406, LEM: 0.4375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3578, partial_loss/deprel_loss: 0.3048, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5035, loss: 0.5067, batch_reg_loss: 0.1881, reg_loss: 0.1881 ||:   4%|4         | 4/95 [00:02<00:46,  1.94it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9668, LAS: 0.9381, UEM: 0.7154, LEM: 0.5356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2848, partial_loss/deprel_loss: 0.2695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4606, loss: 0.4873, batch_reg_loss: 0.1881, reg_loss: 0.1881 ||:   8%|8         | 8/95 [00:04<00:44,  1.94it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9510, UAS: 0.9678, LAS: 0.9385, UEM: 0.6907, LEM: 0.4949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1446, partial_loss/deprel_loss: 0.2444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4125, loss: 0.4866, batch_reg_loss: 0.1880, reg_loss: 0.1881 ||:  14%|#3        | 13/95 [00:06<00:40,  2.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9687, LAS: 0.9392, UEM: 0.6788, LEM: 0.4712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2708, partial_loss/deprel_loss: 0.3406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5147, loss: 0.4863, batch_reg_loss: 0.1880, reg_loss: 0.1881 ||:  19%|#8        | 18/95 [00:08<00:37,  2.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8803, UAS: 0.9653, LAS: 0.9356, UEM: 0.6687, LEM: 0.4583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0776, partial_loss/deprel_loss: 0.6299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9074, loss: 0.5121, batch_reg_loss: 0.1880, reg_loss: 0.1881 ||:  23%|##3       | 22/95 [00:10<00:36,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9662, LAS: 0.9369, UEM: 0.6886, LEM: 0.4802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1285, partial_loss/deprel_loss: 0.2678, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4280, loss: 0.5059, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||:  28%|##8       | 27/95 [00:13<00:33,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9663, LAS: 0.9369, UEM: 0.6907, LEM: 0.4835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1518, partial_loss/deprel_loss: 0.2603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4266, loss: 0.5073, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||:  33%|###2      | 31/95 [00:15<00:31,  2.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9651, LAS: 0.9357, UEM: 0.6733, LEM: 0.4675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4089, partial_loss/deprel_loss: 0.3642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5611, loss: 0.5143, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||:  38%|###7      | 36/95 [00:17<00:28,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9538, UAS: 0.9654, LAS: 0.9361, UEM: 0.6825, LEM: 0.4790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1190, partial_loss/deprel_loss: 0.2261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3926, loss: 0.5107, batch_reg_loss: 0.1880, reg_loss: 0.1880 ||:  42%|####2     | 40/95 [00:19<00:27,  2.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9653, LAS: 0.9361, UEM: 0.6749, LEM: 0.4693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2404, partial_loss/deprel_loss: 0.2831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4625, loss: 0.5092, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||:  47%|####7     | 45/95 [00:21<00:23,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9657, LAS: 0.9362, UEM: 0.6765, LEM: 0.4678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2225, partial_loss/deprel_loss: 0.3255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4928, loss: 0.5081, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||:  53%|#####2    | 50/95 [00:23<00:21,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9660, LAS: 0.9366, UEM: 0.6709, LEM: 0.4587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2004, partial_loss/deprel_loss: 0.2366, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4173, loss: 0.5059, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||:  58%|#####7    | 55/95 [00:26<00:18,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9659, LAS: 0.9366, UEM: 0.6683, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3238, partial_loss/deprel_loss: 0.2760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4734, loss: 0.5053, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||:  63%|######3   | 60/95 [00:28<00:15,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9764, UAS: 0.9665, LAS: 0.9373, UEM: 0.6924, LEM: 0.4914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0326, partial_loss/deprel_loss: 0.0888, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2654, loss: 0.5009, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||:  68%|######8   | 65/95 [00:30<00:14,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9498, UAS: 0.9665, LAS: 0.9375, UEM: 0.6984, LEM: 0.4983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1507, partial_loss/deprel_loss: 0.2718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4355, loss: 0.4997, batch_reg_loss: 0.1879, reg_loss: 0.1880 ||:  74%|#######3  | 70/95 [00:33<00:12,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9665, LAS: 0.9376, UEM: 0.6949, LEM: 0.4936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6818, partial_loss/deprel_loss: 0.5021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7259, loss: 0.5003, batch_reg_loss: 0.1878, reg_loss: 0.1880 ||:  79%|#######8  | 75/95 [00:35<00:09,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9172, UAS: 0.9662, LAS: 0.9372, UEM: 0.6853, LEM: 0.4833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4882, partial_loss/deprel_loss: 0.4265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6266, loss: 0.5023, batch_reg_loss: 0.1878, reg_loss: 0.1880 ||:  84%|########4 | 80/95 [00:37<00:06,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9352, UAS: 0.9665, LAS: 0.9373, UEM: 0.6917, LEM: 0.4898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2493, partial_loss/deprel_loss: 0.3012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4786, loss: 0.5004, batch_reg_loss: 0.1878, reg_loss: 0.1879 ||:  89%|########9 | 85/95 [00:40<00:04,  2.14it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9665, LAS: 0.9373, UEM: 0.6970, LEM: 0.4944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2377, partial_loss/deprel_loss: 0.2672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4491, loss: 0.5000, batch_reg_loss: 0.1878, reg_loss: 0.1879 ||:  95%|#########4| 90/95 [00:42<00:02,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9666, LAS: 0.9374, UEM: 0.6953, LEM: 0.4916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3022, partial_loss/deprel_loss: 0.3378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5184, loss: 0.4993, batch_reg_loss: 0.1878, reg_loss: 0.1879 ||: 100%|##########| 95/95 [00:45<00:00,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9666, LAS: 0.9374, UEM: 0.6953, LEM: 0.4916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3022, partial_loss/deprel_loss: 0.3378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5184, loss: 0.4993, batch_reg_loss: 0.1878, reg_loss: 0.1879 ||: 100%|##########| 95/95 [00:45<00:00,  2.11it/s]\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.188  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - UEM                      |     0.695  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - LEM                      |     0.492  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - EM                       |     0.938  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.302  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - UAS                      |     0.967  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.338  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - loss                     |     0.499  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - LAS                      |     0.937  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:07:36,068 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:07:36,069 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:07:36,072 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:07:39,884 - INFO - combo.training.trainer - Epoch duration: 0:00:51.320842\n",
+      "2023-04-07 02:07:39,885 - INFO - combo.training.trainer - Estimated training time remaining: 4:19:53\n",
+      "2023-04-07 02:07:39,885 - INFO - allennlp.training.trainer - Epoch 173/399\n",
+      "2023-04-07 02:07:39,885 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:07:39,885 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:07:39,894 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9668, LAS: 0.9351, UEM: 0.7266, LEM: 0.5045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1379, partial_loss/deprel_loss: 0.2552, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4195, loss: 0.5019, batch_reg_loss: 0.1877, reg_loss: 0.1877 ||:   5%|5         | 5/95 [00:02<00:45,  1.98it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9691, LAS: 0.9388, UEM: 0.6967, LEM: 0.4699, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2543, partial_loss/deprel_loss: 0.3132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4891, loss: 0.4870, batch_reg_loss: 0.1877, reg_loss: 0.1877 ||:  11%|#         | 10/95 [00:04<00:41,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9680, LAS: 0.9385, UEM: 0.6448, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2867, partial_loss/deprel_loss: 0.3220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5026, loss: 0.4966, batch_reg_loss: 0.1877, reg_loss: 0.1877 ||:  16%|#5        | 15/95 [00:07<00:38,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9652, LAS: 0.9361, UEM: 0.6765, LEM: 0.4808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0895, partial_loss/deprel_loss: 0.1832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3521, loss: 0.5077, batch_reg_loss: 0.1877, reg_loss: 0.1877 ||:  21%|##1       | 20/95 [00:09<00:35,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9654, LAS: 0.9368, UEM: 0.6994, LEM: 0.5103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6584, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6457, loss: 0.5024, batch_reg_loss: 0.1877, reg_loss: 0.1877 ||:  26%|##6       | 25/95 [00:11<00:33,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9669, LAS: 0.9382, UEM: 0.7003, LEM: 0.5003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3080, partial_loss/deprel_loss: 0.2853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4775, loss: 0.4950, batch_reg_loss: 0.1876, reg_loss: 0.1877 ||:  32%|###1      | 30/95 [00:13<00:29,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9671, LAS: 0.9384, UEM: 0.6968, LEM: 0.4940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3844, partial_loss/deprel_loss: 0.3584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5512, loss: 0.4927, batch_reg_loss: 0.1876, reg_loss: 0.1877 ||:  37%|###6      | 35/95 [00:16<00:28,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9666, LAS: 0.9376, UEM: 0.6920, LEM: 0.4878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9114, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7207, loss: 0.4980, batch_reg_loss: 0.1876, reg_loss: 0.1877 ||:  42%|####2     | 40/95 [00:18<00:25,  2.13it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9568, UAS: 0.9680, LAS: 0.9396, UEM: 0.7289, LEM: 0.5380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1540, partial_loss/deprel_loss: 0.2103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3866, loss: 0.4856, batch_reg_loss: 0.1876, reg_loss: 0.1877 ||:  47%|####7     | 45/95 [00:21<00:24,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9686, LAS: 0.9401, UEM: 0.7335, LEM: 0.5403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4065, partial_loss/deprel_loss: 0.3558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5535, loss: 0.4817, batch_reg_loss: 0.1876, reg_loss: 0.1877 ||:  53%|#####2    | 50/95 [00:23<00:21,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9686, LAS: 0.9400, UEM: 0.7342, LEM: 0.5408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3939, partial_loss/deprel_loss: 0.2988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5054, loss: 0.4833, batch_reg_loss: 0.1875, reg_loss: 0.1876 ||:  58%|#####7    | 55/95 [00:26<00:19,  2.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9679, LAS: 0.9392, UEM: 0.7241, LEM: 0.5296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0444, partial_loss/deprel_loss: 0.4688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7715, loss: 0.4892, batch_reg_loss: 0.1875, reg_loss: 0.1876 ||:  63%|######3   | 60/95 [00:28<00:16,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9678, LAS: 0.9390, UEM: 0.7198, LEM: 0.5223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4509, partial_loss/deprel_loss: 0.3862, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5867, loss: 0.4908, batch_reg_loss: 0.1875, reg_loss: 0.1876 ||:  68%|######8   | 65/95 [00:30<00:13,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9674, LAS: 0.9387, UEM: 0.7102, LEM: 0.5122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2441, partial_loss/deprel_loss: 0.2851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4644, loss: 0.4921, batch_reg_loss: 0.1875, reg_loss: 0.1876 ||:  74%|#######3  | 70/95 [00:33<00:11,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9668, LAS: 0.9379, UEM: 0.7007, LEM: 0.5021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7125, partial_loss/deprel_loss: 0.4865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7191, loss: 0.4986, batch_reg_loss: 0.1875, reg_loss: 0.1876 ||:  79%|#######8  | 75/95 [00:35<00:09,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9674, LAS: 0.9383, UEM: 0.7049, LEM: 0.5035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1480, partial_loss/deprel_loss: 0.3090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4643, loss: 0.4961, batch_reg_loss: 0.1874, reg_loss: 0.1876 ||:  84%|########4 | 80/95 [00:37<00:07,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9527, UAS: 0.9675, LAS: 0.9383, UEM: 0.7038, LEM: 0.5023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1645, partial_loss/deprel_loss: 0.2580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.4957, batch_reg_loss: 0.1874, reg_loss: 0.1876 ||:  89%|########9 | 85/95 [00:40<00:04,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9676, LAS: 0.9384, UEM: 0.7036, LEM: 0.4999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2718, partial_loss/deprel_loss: 0.3316, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5071, loss: 0.4949, batch_reg_loss: 0.1874, reg_loss: 0.1876 ||:  95%|#########4| 90/95 [00:42<00:02,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9674, LAS: 0.9380, UEM: 0.6967, LEM: 0.4923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3628, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5687, loss: 0.4976, batch_reg_loss: 0.1874, reg_loss: 0.1876 ||: 100%|##########| 95/95 [00:44<00:00,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9674, LAS: 0.9380, UEM: 0.6967, LEM: 0.4923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3628, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5687, loss: 0.4976, batch_reg_loss: 0.1874, reg_loss: 0.1876 ||: 100%|##########| 95/95 [00:44<00:00,  2.12it/s]\n",
+      "2023-04-07 02:08:27,737 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.188  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - UEM                      |     0.697  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - LEM                      |     0.492  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - EM                       |     0.923  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.363  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - UAS                      |     0.967  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.386  |       N/A\n",
+      "2023-04-07 02:08:27,738 - INFO - combo.training.tensorboard_writer - loss                     |     0.498  |       N/A\n",
+      "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - LAS                      |     0.938  |       N/A\n",
+      "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.845  |       N/A\n",
+      "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:08:27,739 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:08:27,744 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:08:32,237 - INFO - combo.training.trainer - Epoch duration: 0:00:52.352574\n",
+      "2023-04-07 02:08:32,238 - INFO - combo.training.trainer - Estimated training time remaining: 4:18:23\n",
+      "2023-04-07 02:08:32,238 - INFO - allennlp.training.trainer - Epoch 174/399\n",
+      "2023-04-07 02:08:32,238 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:08:32,239 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:08:32,250 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9597, UAS: 0.9754, LAS: 0.9467, UEM: 0.7662, LEM: 0.5495, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0672, partial_loss/deprel_loss: 0.1893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3522, loss: 0.4420, batch_reg_loss: 0.1874, reg_loss: 0.1874 ||:   5%|5         | 5/95 [00:02<00:42,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9713, LAS: 0.9423, UEM: 0.7106, LEM: 0.4840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2048, partial_loss/deprel_loss: 0.2832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4549, loss: 0.4666, batch_reg_loss: 0.1874, reg_loss: 0.1874 ||:  11%|#         | 10/95 [00:04<00:40,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9706, LAS: 0.9419, UEM: 0.6911, LEM: 0.4658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2233, partial_loss/deprel_loss: 0.2813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4570, loss: 0.4739, batch_reg_loss: 0.1873, reg_loss: 0.1874 ||:  16%|#5        | 15/95 [00:06<00:37,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9699, LAS: 0.9412, UEM: 0.6877, LEM: 0.4705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3466, partial_loss/deprel_loss: 0.3447, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5324, loss: 0.4771, batch_reg_loss: 0.1873, reg_loss: 0.1874 ||:  21%|##1       | 20/95 [00:09<00:35,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9690, LAS: 0.9393, UEM: 0.7068, LEM: 0.4927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7900, partial_loss/deprel_loss: 0.4784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7280, loss: 0.4828, batch_reg_loss: 0.1873, reg_loss: 0.1873 ||:  26%|##6       | 25/95 [00:11<00:33,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9658, LAS: 0.9361, UEM: 0.6803, LEM: 0.4683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8419, partial_loss/deprel_loss: 0.5101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7638, loss: 0.5070, batch_reg_loss: 0.1873, reg_loss: 0.1873 ||:  32%|###1      | 30/95 [00:14<00:31,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9554, UAS: 0.9666, LAS: 0.9369, UEM: 0.6862, LEM: 0.4727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1228, partial_loss/deprel_loss: 0.2493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4113, loss: 0.5049, batch_reg_loss: 0.1873, reg_loss: 0.1873 ||:  36%|###5      | 34/95 [00:16<00:29,  2.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9661, LAS: 0.9365, UEM: 0.6719, LEM: 0.4587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4983, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5741, loss: 0.5089, batch_reg_loss: 0.1873, reg_loss: 0.1873 ||:  40%|####      | 38/95 [00:18<00:28,  2.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9486, UAS: 0.9666, LAS: 0.9373, UEM: 0.6827, LEM: 0.4704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1798, partial_loss/deprel_loss: 0.2568, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4286, loss: 0.5011, batch_reg_loss: 0.1873, reg_loss: 0.1873 ||:  45%|####5     | 43/95 [00:20<00:25,  2.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9667, LAS: 0.9374, UEM: 0.6793, LEM: 0.4653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1713, partial_loss/deprel_loss: 0.2444, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4170, loss: 0.4999, batch_reg_loss: 0.1872, reg_loss: 0.1873 ||:  51%|#####     | 48/95 [00:23<00:22,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9663, LAS: 0.9371, UEM: 0.6693, LEM: 0.4551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3065, partial_loss/deprel_loss: 0.3364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5176, loss: 0.5033, batch_reg_loss: 0.1872, reg_loss: 0.1873 ||:  56%|#####5    | 53/95 [00:25<00:20,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9667, LAS: 0.9375, UEM: 0.6694, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2536, partial_loss/deprel_loss: 0.2654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4502, loss: 0.4998, batch_reg_loss: 0.1872, reg_loss: 0.1873 ||:  61%|######1   | 58/95 [00:27<00:17,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9732, UAS: 0.9672, LAS: 0.9381, UEM: 0.6852, LEM: 0.4772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0324, partial_loss/deprel_loss: 0.0998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2735, loss: 0.4956, batch_reg_loss: 0.1872, reg_loss: 0.1873 ||:  66%|######6   | 63/95 [00:30<00:15,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9498, UAS: 0.9675, LAS: 0.9383, UEM: 0.6916, LEM: 0.4835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1398, partial_loss/deprel_loss: 0.2216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3924, loss: 0.4931, batch_reg_loss: 0.1872, reg_loss: 0.1873 ||:  72%|#######1  | 68/95 [00:32<00:12,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9673, LAS: 0.9384, UEM: 0.6854, LEM: 0.4777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.3302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5172, loss: 0.4935, batch_reg_loss: 0.1871, reg_loss: 0.1873 ||:  77%|#######6  | 73/95 [00:34<00:10,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9451, UAS: 0.9668, LAS: 0.9379, UEM: 0.6789, LEM: 0.4706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1879, partial_loss/deprel_loss: 0.2809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4494, loss: 0.4964, batch_reg_loss: 0.1871, reg_loss: 0.1873 ||:  82%|########2 | 78/95 [00:37<00:08,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9669, LAS: 0.9381, UEM: 0.6832, LEM: 0.4790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3689, partial_loss/deprel_loss: 0.3222, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5186, loss: 0.4952, batch_reg_loss: 0.1871, reg_loss: 0.1872 ||:  87%|########7 | 83/95 [00:39<00:05,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9557, UAS: 0.9676, LAS: 0.9388, UEM: 0.6984, LEM: 0.4952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0900, partial_loss/deprel_loss: 0.1902, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3573, loss: 0.4903, batch_reg_loss: 0.1871, reg_loss: 0.1872 ||:  93%|#########2| 88/95 [00:42<00:03,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9680, LAS: 0.9391, UEM: 0.7009, LEM: 0.4951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1930, partial_loss/deprel_loss: 0.2365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4149, loss: 0.4885, batch_reg_loss: 0.1871, reg_loss: 0.1872 ||:  98%|#########7| 93/95 [00:44<00:00,  2.07it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9677, LAS: 0.9389, UEM: 0.6975, LEM: 0.4919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3214, partial_loss/deprel_loss: 0.2698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4672, loss: 0.4900, batch_reg_loss: 0.1870, reg_loss: 0.1872 ||: 100%|##########| 95/95 [00:45<00:00,  2.09it/s]\n",
+      "2023-04-07 02:09:20,939 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:09:20,939 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 02:09:20,939 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.187  |       N/A\n",
+      "2023-04-07 02:09:20,939 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - UEM                      |     0.697  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - LEM                      |     0.492  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - EM                       |     0.945  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.321  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - UAS                      |     0.968  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.270  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - loss                     |     0.490  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - LAS                      |     0.939  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:09:20,940 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:09:20,945 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:09:25,709 - INFO - combo.training.trainer - Epoch duration: 0:00:53.471397\n",
+      "2023-04-07 02:09:25,710 - INFO - combo.training.trainer - Estimated training time remaining: 4:16:55\n",
+      "2023-04-07 02:09:25,710 - INFO - allennlp.training.trainer - Epoch 175/399\n",
+      "2023-04-07 02:09:25,710 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:09:25,711 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:09:25,720 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9662, LAS: 0.9369, UEM: 0.7409, LEM: 0.5371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1297, partial_loss/deprel_loss: 0.2315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3982, loss: 0.4858, batch_reg_loss: 0.1870, reg_loss: 0.1870 ||:   5%|5         | 5/95 [00:02<00:43,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9423, UAS: 0.9621, LAS: 0.9336, UEM: 0.6399, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2192, partial_loss/deprel_loss: 0.2733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4495, loss: 0.5212, batch_reg_loss: 0.1870, reg_loss: 0.1870 ||:  11%|#         | 10/95 [00:04<00:40,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9637, LAS: 0.9356, UEM: 0.6253, LEM: 0.4157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5335, partial_loss/deprel_loss: 0.3490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.5136, batch_reg_loss: 0.1870, reg_loss: 0.1870 ||:  15%|#4        | 14/95 [00:06<00:39,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9643, LAS: 0.9366, UEM: 0.6265, LEM: 0.4171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2836, partial_loss/deprel_loss: 0.3064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4888, loss: 0.5072, batch_reg_loss: 0.1870, reg_loss: 0.1870 ||:  20%|##        | 19/95 [00:09<00:36,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9650, LAS: 0.9375, UEM: 0.6447, LEM: 0.4437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2784, partial_loss/deprel_loss: 0.2675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4567, loss: 0.4992, batch_reg_loss: 0.1870, reg_loss: 0.1870 ||:  25%|##5       | 24/95 [00:11<00:33,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9352, UAS: 0.9668, LAS: 0.9390, UEM: 0.6874, LEM: 0.4897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2737, partial_loss/deprel_loss: 0.3384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.4892, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||:  31%|###       | 29/95 [00:13<00:31,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9667, LAS: 0.9385, UEM: 0.6772, LEM: 0.4748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3763, partial_loss/deprel_loss: 0.3628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5525, loss: 0.4919, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||:  36%|###5      | 34/95 [00:16<00:28,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9664, LAS: 0.9384, UEM: 0.6660, LEM: 0.4586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3088, partial_loss/deprel_loss: 0.3559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5334, loss: 0.4938, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||:  41%|####1     | 39/95 [00:18<00:25,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9534, UAS: 0.9668, LAS: 0.9387, UEM: 0.6746, LEM: 0.4676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1448, partial_loss/deprel_loss: 0.2160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3886, loss: 0.4902, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||:  46%|####6     | 44/95 [00:20<00:23,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9486, UAS: 0.9672, LAS: 0.9391, UEM: 0.6930, LEM: 0.4894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1267, partial_loss/deprel_loss: 0.2429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4065, loss: 0.4877, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||:  52%|#####1    | 49/95 [00:23<00:21,  2.10it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9553, UAS: 0.9665, LAS: 0.9385, UEM: 0.6856, LEM: 0.4828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1364, partial_loss/deprel_loss: 0.2059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3788, loss: 0.4915, batch_reg_loss: 0.1869, reg_loss: 0.1870 ||:  57%|#####6    | 54/95 [00:25<00:19,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9659, LAS: 0.9379, UEM: 0.6728, LEM: 0.4709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3806, partial_loss/deprel_loss: 0.3239, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5221, loss: 0.4978, batch_reg_loss: 0.1868, reg_loss: 0.1869 ||:  62%|######2   | 59/95 [00:27<00:16,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9665, LAS: 0.9384, UEM: 0.6843, LEM: 0.4827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1283, partial_loss/deprel_loss: 0.1964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3696, loss: 0.4941, batch_reg_loss: 0.1868, reg_loss: 0.1869 ||:  67%|######7   | 64/95 [00:30<00:14,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9666, LAS: 0.9384, UEM: 0.6792, LEM: 0.4764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3055, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5591, loss: 0.4943, batch_reg_loss: 0.1868, reg_loss: 0.1869 ||:  73%|#######2  | 69/95 [00:32<00:11,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9672, LAS: 0.9389, UEM: 0.6884, LEM: 0.4856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1952, partial_loss/deprel_loss: 0.2882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4564, loss: 0.4904, batch_reg_loss: 0.1868, reg_loss: 0.1869 ||:  78%|#######7  | 74/95 [00:34<00:09,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9667, LAS: 0.9385, UEM: 0.6771, LEM: 0.4741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4252, partial_loss/deprel_loss: 0.3328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5380, loss: 0.4942, batch_reg_loss: 0.1868, reg_loss: 0.1869 ||:  83%|########3 | 79/95 [00:37<00:07,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9668, LAS: 0.9387, UEM: 0.6865, LEM: 0.4900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1773, partial_loss/deprel_loss: 0.2759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4429, loss: 0.4927, batch_reg_loss: 0.1867, reg_loss: 0.1869 ||:  88%|########8 | 84/95 [00:39<00:05,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9676, LAS: 0.9392, UEM: 0.7002, LEM: 0.4987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1410, partial_loss/deprel_loss: 0.2602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4231, loss: 0.4887, batch_reg_loss: 0.1867, reg_loss: 0.1869 ||:  94%|#########3| 89/95 [00:42<00:02,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9549, UAS: 0.9678, LAS: 0.9395, UEM: 0.7012, LEM: 0.4997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0891, partial_loss/deprel_loss: 0.2031, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3670, loss: 0.4872, batch_reg_loss: 0.1867, reg_loss: 0.1869 ||:  99%|#########8| 94/95 [00:44<00:00,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9676, LAS: 0.9393, UEM: 0.6989, LEM: 0.4977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5695, partial_loss/deprel_loss: 0.3864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6098, loss: 0.4885, batch_reg_loss: 0.1867, reg_loss: 0.1869 ||: 100%|##########| 95/95 [00:44<00:00,  2.11it/s]\n",
+      "2023-04-07 02:10:13,809 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9487, LAS: 0.8983, UEM: 0.6867, LEM: 0.4739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0548, partial_loss/deprel_loss: 8.0360, partial_loss/cycle_loss: 0.0000, batch_loss: 6.6398, loss: 7.0117, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  36%|###6      | 4/11 [00:02<00:04,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9503, LAS: 0.9017, UEM: 0.7040, LEM: 0.4726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5264, partial_loss/deprel_loss: 16.6715, partial_loss/cycle_loss: 0.0000, batch_loss: 13.6425, loss: 7.3681, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:04<00:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9518, LAS: 0.9014, UEM: 0.6831, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5225, partial_loss/deprel_loss: 7.1535, partial_loss/cycle_loss: 0.0000, batch_loss: 5.8273, loss: 7.1744, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00,  1.51it/s] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9518, LAS: 0.9014, UEM: 0.6831, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5225, partial_loss/deprel_loss: 7.1535, partial_loss/cycle_loss: 0.0000, batch_loss: 5.8273, loss: 7.1744, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00,  1.50it/s]\n",
+      "2023-04-07 02:10:21,133 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:10:21,133 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 02:10:21,133 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.187  |     0.000\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - UEM                      |     0.699  |     0.683\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - LEM                      |     0.498  |     0.415\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - EM                       |     0.920  |     0.905\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.570  |     0.523\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - UAS                      |     0.968  |     0.952\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.386  |     7.153\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - loss                     |     0.489  |     7.174\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - LAS                      |     0.939  |     0.901\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:10:21,134 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:10:21,135 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:10:21,135 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 02:10:21,139 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:10:25,839 - INFO - combo.training.trainer - Epoch duration: 0:01:00.129085\n",
+      "2023-04-07 02:10:25,840 - INFO - combo.training.trainer - Estimated training time remaining: 4:15:35\n",
+      "2023-04-07 02:10:25,840 - INFO - allennlp.training.trainer - Epoch 176/399\n",
+      "2023-04-07 02:10:25,840 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:10:25,841 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:10:25,850 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9736, LAS: 0.9421, UEM: 0.7172, LEM: 0.4547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2733, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4890, loss: 0.4643, batch_reg_loss: 0.1867, reg_loss: 0.1867 ||:   5%|5         | 5/95 [00:02<00:38,  2.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9735, LAS: 0.9443, UEM: 0.7156, LEM: 0.4755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1517, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4258, loss: 0.4558, batch_reg_loss: 0.1867, reg_loss: 0.1867 ||:  11%|#         | 10/95 [00:04<00:36,  2.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9701, LAS: 0.9417, UEM: 0.7079, LEM: 0.4924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1365, partial_loss/deprel_loss: 0.2318, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3994, loss: 0.4714, batch_reg_loss: 0.1866, reg_loss: 0.1867 ||:  16%|#5        | 15/95 [00:06<00:36,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9689, LAS: 0.9400, UEM: 0.6964, LEM: 0.4766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5728, partial_loss/deprel_loss: 0.3881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6117, loss: 0.4803, batch_reg_loss: 0.1866, reg_loss: 0.1866 ||:  21%|##1       | 20/95 [00:09<00:34,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9700, LAS: 0.9414, UEM: 0.7148, LEM: 0.4964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0880, partial_loss/deprel_loss: 0.1952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3603, loss: 0.4688, batch_reg_loss: 0.1866, reg_loss: 0.1866 ||:  26%|##6       | 25/95 [00:11<00:32,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9536, UAS: 0.9701, LAS: 0.9414, UEM: 0.7079, LEM: 0.4883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0996, partial_loss/deprel_loss: 0.2304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3908, loss: 0.4698, batch_reg_loss: 0.1866, reg_loss: 0.1866 ||:  32%|###1      | 30/95 [00:13<00:28,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9710, LAS: 0.9429, UEM: 0.7498, LEM: 0.5551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 0.1781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3574, loss: 0.4600, batch_reg_loss: 0.1866, reg_loss: 0.1866 ||:  36%|###5      | 34/95 [00:15<00:29,  2.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9702, LAS: 0.9423, UEM: 0.7355, LEM: 0.5374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5495, partial_loss/deprel_loss: 0.3517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5778, loss: 0.4654, batch_reg_loss: 0.1865, reg_loss: 0.1866 ||:  41%|####1     | 39/95 [00:18<00:26,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9703, LAS: 0.9422, UEM: 0.7315, LEM: 0.5286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4231, partial_loss/deprel_loss: 0.3928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5854, loss: 0.4662, batch_reg_loss: 0.1865, reg_loss: 0.1866 ||:  45%|####5     | 43/95 [00:20<00:25,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9597, UAS: 0.9705, LAS: 0.9425, UEM: 0.7315, LEM: 0.5290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0979, partial_loss/deprel_loss: 0.2064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3712, loss: 0.4664, batch_reg_loss: 0.1865, reg_loss: 0.1866 ||:  51%|#####     | 48/95 [00:22<00:22,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9698, LAS: 0.9417, UEM: 0.7230, LEM: 0.5194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5247, partial_loss/deprel_loss: 0.3651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5835, loss: 0.4715, batch_reg_loss: 0.1865, reg_loss: 0.1866 ||:  56%|#####5    | 53/95 [00:24<00:19,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9483, UAS: 0.9694, LAS: 0.9411, UEM: 0.7197, LEM: 0.5139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1925, partial_loss/deprel_loss: 0.3408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4976, loss: 0.4757, batch_reg_loss: 0.1865, reg_loss: 0.1866 ||:  61%|######1   | 58/95 [00:27<00:17,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9694, LAS: 0.9412, UEM: 0.7165, LEM: 0.5096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2613, partial_loss/deprel_loss: 0.3015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4799, loss: 0.4759, batch_reg_loss: 0.1864, reg_loss: 0.1866 ||:  66%|######6   | 63/95 [00:29<00:15,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9604, UAS: 0.9693, LAS: 0.9412, UEM: 0.7166, LEM: 0.5146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0665, partial_loss/deprel_loss: 0.1377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3099, loss: 0.4770, batch_reg_loss: 0.1864, reg_loss: 0.1865 ||:  72%|#######1  | 68/95 [00:31<00:12,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9691, LAS: 0.9411, UEM: 0.7162, LEM: 0.5155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7586, partial_loss/deprel_loss: 0.4775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7201, loss: 0.4784, batch_reg_loss: 0.1864, reg_loss: 0.1865 ||:  77%|#######6  | 73/95 [00:34<00:10,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9689, LAS: 0.9408, UEM: 0.7165, LEM: 0.5143, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9787, partial_loss/deprel_loss: 0.5288, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8052, loss: 0.4813, batch_reg_loss: 0.1864, reg_loss: 0.1865 ||:  82%|########2 | 78/95 [00:36<00:08,  2.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9686, LAS: 0.9405, UEM: 0.7123, LEM: 0.5082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3432, partial_loss/deprel_loss: 0.3228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5132, loss: 0.4826, batch_reg_loss: 0.1864, reg_loss: 0.1865 ||:  87%|########7 | 83/95 [00:38<00:05,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9681, LAS: 0.9400, UEM: 0.7034, LEM: 0.4989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2496, partial_loss/deprel_loss: 0.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4564, loss: 0.4858, batch_reg_loss: 0.1864, reg_loss: 0.1865 ||:  93%|#########2| 88/95 [00:41<00:03,  2.14it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9684, LAS: 0.9402, UEM: 0.7072, LEM: 0.5033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3478, partial_loss/deprel_loss: 0.2936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4908, loss: 0.4848, batch_reg_loss: 0.1863, reg_loss: 0.1865 ||:  98%|#########7| 93/95 [00:43<00:00,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9683, LAS: 0.9401, UEM: 0.7039, LEM: 0.4996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3500, partial_loss/deprel_loss: 0.3141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5076, loss: 0.4860, batch_reg_loss: 0.1863, reg_loss: 0.1865 ||: 100%|##########| 95/95 [00:44<00:00,  2.13it/s]\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.187  |       N/A\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - UEM                      |     0.704  |       N/A\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - LEM                      |     0.500  |       N/A\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - EM                       |     0.941  |       N/A\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.350  |       N/A\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - UAS                      |     0.968  |       N/A\n",
+      "2023-04-07 02:11:13,578 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.314  |       N/A\n",
+      "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - loss                     |     0.486  |       N/A\n",
+      "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - LAS                      |     0.940  |       N/A\n",
+      "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:11:13,579 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:11:13,585 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:11:18,407 - INFO - combo.training.trainer - Epoch duration: 0:00:52.567475\n",
+      "2023-04-07 02:11:18,408 - INFO - combo.training.trainer - Estimated training time remaining: 4:14:07\n",
+      "2023-04-07 02:11:18,408 - INFO - allennlp.training.trainer - Epoch 177/399\n",
+      "2023-04-07 02:11:18,408 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:11:18,409 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:11:18,417 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9532, UAS: 0.9691, LAS: 0.9429, UEM: 0.7046, LEM: 0.5057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1772, partial_loss/deprel_loss: 0.2249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4017, loss: 0.4576, batch_reg_loss: 0.1863, reg_loss: 0.1863 ||:   5%|5         | 5/95 [00:02<00:38,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9549, UAS: 0.9739, LAS: 0.9472, UEM: 0.7883, LEM: 0.5924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 0.2064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3798, loss: 0.4267, batch_reg_loss: 0.1863, reg_loss: 0.1863 ||:  11%|#         | 10/95 [00:04<00:38,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9735, LAS: 0.9456, UEM: 0.7580, LEM: 0.5463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1520, partial_loss/deprel_loss: 0.2291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3999, loss: 0.4449, batch_reg_loss: 0.1863, reg_loss: 0.1863 ||:  16%|#5        | 15/95 [00:07<00:36,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9725, LAS: 0.9443, UEM: 0.7376, LEM: 0.5214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2179, partial_loss/deprel_loss: 0.2340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4170, loss: 0.4530, batch_reg_loss: 0.1863, reg_loss: 0.1863 ||:  21%|##1       | 20/95 [00:09<00:33,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9541, UAS: 0.9734, LAS: 0.9455, UEM: 0.7734, LEM: 0.5827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0992, partial_loss/deprel_loss: 0.1703, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3423, loss: 0.4430, batch_reg_loss: 0.1862, reg_loss: 0.1863 ||:  25%|##5       | 24/95 [00:11<00:33,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9715, LAS: 0.9437, UEM: 0.7634, LEM: 0.5770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4981, partial_loss/deprel_loss: 0.3644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5773, loss: 0.4542, batch_reg_loss: 0.1862, reg_loss: 0.1863 ||:  29%|##9       | 28/95 [00:13<00:32,  2.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9719, LAS: 0.9438, UEM: 0.7596, LEM: 0.5644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1283, partial_loss/deprel_loss: 0.2279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3942, loss: 0.4535, batch_reg_loss: 0.1862, reg_loss: 0.1863 ||:  36%|###5      | 34/95 [00:15<00:28,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9712, LAS: 0.9433, UEM: 0.7448, LEM: 0.5488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3113, partial_loss/deprel_loss: 0.3193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5039, loss: 0.4607, batch_reg_loss: 0.1862, reg_loss: 0.1863 ||:  41%|####1     | 39/95 [00:17<00:25,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9700, LAS: 0.9424, UEM: 0.7470, LEM: 0.5602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1133, partial_loss/deprel_loss: 0.2004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3691, loss: 0.4649, batch_reg_loss: 0.1862, reg_loss: 0.1863 ||:  46%|####6     | 44/95 [00:20<00:23,  2.18it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9695, LAS: 0.9418, UEM: 0.7385, LEM: 0.5475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6892, partial_loss/deprel_loss: 0.4599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6919, loss: 0.4696, batch_reg_loss: 0.1861, reg_loss: 0.1862 ||:  52%|#####1    | 49/95 [00:22<00:20,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9682, LAS: 0.9405, UEM: 0.7245, LEM: 0.5336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9134, partial_loss/deprel_loss: 0.4578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7351, loss: 0.4782, batch_reg_loss: 0.1861, reg_loss: 0.1862 ||:  57%|#####6    | 54/95 [00:24<00:18,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9683, LAS: 0.9404, UEM: 0.7213, LEM: 0.5261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2665, partial_loss/deprel_loss: 0.3174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4933, loss: 0.4771, batch_reg_loss: 0.1861, reg_loss: 0.1862 ||:  63%|######3   | 60/95 [00:26<00:15,  2.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9515, UAS: 0.9686, LAS: 0.9406, UEM: 0.7199, LEM: 0.5221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4390, loss: 0.4748, batch_reg_loss: 0.1861, reg_loss: 0.1862 ||:  68%|######8   | 65/95 [00:29<00:13,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9686, LAS: 0.9405, UEM: 0.7183, LEM: 0.5185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1395, partial_loss/deprel_loss: 0.2363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4030, loss: 0.4750, batch_reg_loss: 0.1861, reg_loss: 0.1862 ||:  74%|#######3  | 70/95 [00:31<00:11,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9676, LAS: 0.9396, UEM: 0.7092, LEM: 0.5094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4908, partial_loss/deprel_loss: 0.3907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5968, loss: 0.4827, batch_reg_loss: 0.1861, reg_loss: 0.1862 ||:  79%|#######8  | 75/95 [00:33<00:09,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9671, LAS: 0.9389, UEM: 0.6995, LEM: 0.4986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2549, partial_loss/deprel_loss: 0.2794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4605, loss: 0.4870, batch_reg_loss: 0.1860, reg_loss: 0.1862 ||:  84%|########4 | 80/95 [00:36<00:06,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9674, LAS: 0.9394, UEM: 0.6988, LEM: 0.4968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2487, partial_loss/deprel_loss: 0.2758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4565, loss: 0.4839, batch_reg_loss: 0.1860, reg_loss: 0.1862 ||:  89%|########9 | 85/95 [00:38<00:04,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9675, LAS: 0.9393, UEM: 0.6969, LEM: 0.4925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0929, partial_loss/deprel_loss: 0.2407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3971, loss: 0.4851, batch_reg_loss: 0.1860, reg_loss: 0.1862 ||:  95%|#########4| 90/95 [00:40<00:02,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9675, LAS: 0.9391, UEM: 0.6996, LEM: 0.4956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3971, partial_loss/deprel_loss: 0.3080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.4848, batch_reg_loss: 0.1860, reg_loss: 0.1862 ||: 100%|##########| 95/95 [00:42<00:00,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9675, LAS: 0.9391, UEM: 0.6996, LEM: 0.4956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3971, partial_loss/deprel_loss: 0.3080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.4848, batch_reg_loss: 0.1860, reg_loss: 0.1862 ||: 100%|##########| 95/95 [00:42<00:00,  2.22it/s]\n",
+      "2023-04-07 02:12:04,416 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:12:04,416 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 02:12:04,416 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.186  |       N/A\n",
+      "2023-04-07 02:12:04,416 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - UEM                      |     0.700  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - LEM                      |     0.496  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - EM                       |     0.929  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.397  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - UAS                      |     0.968  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.308  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - loss                     |     0.485  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - LAS                      |     0.939  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:12:04,417 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:12:04,418 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:12:04,418 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:12:04,418 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:12:04,422 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:12:09,262 - INFO - combo.training.trainer - Epoch duration: 0:00:50.853596\n",
+      "2023-04-07 02:12:09,262 - INFO - combo.training.trainer - Estimated training time remaining: 4:12:37\n",
+      "2023-04-07 02:12:09,262 - INFO - allennlp.training.trainer - Epoch 178/399\n",
+      "2023-04-07 02:12:09,263 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:12:09,263 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:12:09,271 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9593, UAS: 0.9771, LAS: 0.9459, UEM: 0.8007, LEM: 0.5751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0742, partial_loss/deprel_loss: 0.1687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3357, loss: 0.4355, batch_reg_loss: 0.1860, reg_loss: 0.1860 ||:   5%|5         | 5/95 [00:02<00:41,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9691, LAS: 0.9408, UEM: 0.7053, LEM: 0.4880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7240, partial_loss/deprel_loss: 0.3619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6203, loss: 0.4856, batch_reg_loss: 0.1860, reg_loss: 0.1860 ||:  11%|#         | 10/95 [00:04<00:39,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9661, LAS: 0.9379, UEM: 0.6407, LEM: 0.4330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2132, partial_loss/deprel_loss: 0.2303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4128, loss: 0.4981, batch_reg_loss: 0.1859, reg_loss: 0.1860 ||:  16%|#5        | 15/95 [00:06<00:36,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9692, LAS: 0.9409, UEM: 0.7156, LEM: 0.5118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1023, partial_loss/deprel_loss: 0.2382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3970, loss: 0.4764, batch_reg_loss: 0.1859, reg_loss: 0.1860 ||:  21%|##1       | 20/95 [00:09<00:34,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9672, LAS: 0.9391, UEM: 0.6871, LEM: 0.4828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4981, partial_loss/deprel_loss: 0.3675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5795, loss: 0.4870, batch_reg_loss: 0.1859, reg_loss: 0.1859 ||:  26%|##6       | 25/95 [00:11<00:31,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9564, UAS: 0.9672, LAS: 0.9392, UEM: 0.7025, LEM: 0.4973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1483, partial_loss/deprel_loss: 0.2250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3956, loss: 0.4867, batch_reg_loss: 0.1859, reg_loss: 0.1859 ||:  31%|###       | 29/95 [00:13<00:31,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9682, LAS: 0.9402, UEM: 0.7164, LEM: 0.5110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0899, partial_loss/deprel_loss: 0.2149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3757, loss: 0.4796, batch_reg_loss: 0.1859, reg_loss: 0.1859 ||:  35%|###4      | 33/95 [00:15<00:30,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9676, LAS: 0.9394, UEM: 0.7095, LEM: 0.5035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2311, partial_loss/deprel_loss: 0.2782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4546, loss: 0.4861, batch_reg_loss: 0.1859, reg_loss: 0.1859 ||:  40%|####      | 38/95 [00:17<00:27,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9664, LAS: 0.9381, UEM: 0.6917, LEM: 0.4876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3869, partial_loss/deprel_loss: 0.3763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5643, loss: 0.4963, batch_reg_loss: 0.1858, reg_loss: 0.1859 ||:  44%|####4     | 42/95 [00:19<00:25,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9671, LAS: 0.9385, UEM: 0.6923, LEM: 0.4830, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2153, partial_loss/deprel_loss: 0.2968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4664, loss: 0.4938, batch_reg_loss: 0.1858, reg_loss: 0.1859 ||:  49%|####9     | 47/95 [00:21<00:22,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9616, UAS: 0.9676, LAS: 0.9390, UEM: 0.7013, LEM: 0.4943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0641, partial_loss/deprel_loss: 0.1436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3135, loss: 0.4904, batch_reg_loss: 0.1858, reg_loss: 0.1859 ||:  55%|#####4    | 52/95 [00:23<00:19,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9677, LAS: 0.9387, UEM: 0.6950, LEM: 0.4842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3082, partial_loss/deprel_loss: 0.3621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5371, loss: 0.4918, batch_reg_loss: 0.1858, reg_loss: 0.1859 ||:  60%|######    | 57/95 [00:26<00:17,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9678, LAS: 0.9390, UEM: 0.6928, LEM: 0.4797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1609, partial_loss/deprel_loss: 0.2728, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4362, loss: 0.4911, batch_reg_loss: 0.1858, reg_loss: 0.1859 ||:  65%|######5   | 62/95 [00:28<00:14,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9479, UAS: 0.9684, LAS: 0.9397, UEM: 0.6997, LEM: 0.4862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2115, partial_loss/deprel_loss: 0.2146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3997, loss: 0.4859, batch_reg_loss: 0.1858, reg_loss: 0.1859 ||:  71%|#######   | 67/95 [00:30<00:12,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9680, LAS: 0.9391, UEM: 0.6943, LEM: 0.4817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4662, partial_loss/deprel_loss: 0.4066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6043, loss: 0.4896, batch_reg_loss: 0.1857, reg_loss: 0.1859 ||:  76%|#######5  | 72/95 [00:32<00:10,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9681, LAS: 0.9392, UEM: 0.6975, LEM: 0.4857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5883, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5905, loss: 0.4893, batch_reg_loss: 0.1857, reg_loss: 0.1859 ||:  81%|########1 | 77/95 [00:35<00:08,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9686, LAS: 0.9400, UEM: 0.7131, LEM: 0.5090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3220, partial_loss/deprel_loss: 0.3004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4905, loss: 0.4845, batch_reg_loss: 0.1857, reg_loss: 0.1858 ||:  86%|########6 | 82/95 [00:37<00:05,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9687, LAS: 0.9400, UEM: 0.7106, LEM: 0.5041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2107, partial_loss/deprel_loss: 0.2866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4571, loss: 0.4844, batch_reg_loss: 0.1857, reg_loss: 0.1858 ||:  92%|#########1| 87/95 [00:39<00:03,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9527, UAS: 0.9688, LAS: 0.9402, UEM: 0.7071, LEM: 0.4997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2027, partial_loss/deprel_loss: 0.2632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4368, loss: 0.4833, batch_reg_loss: 0.1857, reg_loss: 0.1858 ||:  97%|#########6| 92/95 [00:41<00:01,  2.26it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9685, LAS: 0.9399, UEM: 0.7062, LEM: 0.4987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8674, partial_loss/deprel_loss: 0.5190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7743, loss: 0.4859, batch_reg_loss: 0.1857, reg_loss: 0.1858 ||: 100%|##########| 95/95 [00:43<00:00,  2.19it/s]\n",
+      "2023-04-07 02:12:55,913 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.186  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - UEM                      |     0.706  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - LEM                      |     0.499  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - EM                       |     0.900  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.867  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - UAS                      |     0.969  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.519  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - loss                     |     0.486  |       N/A\n",
+      "2023-04-07 02:12:55,914 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - LAS                      |     0.940  |       N/A\n",
+      "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:12:55,915 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:12:55,921 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:13:00,792 - INFO - combo.training.trainer - Epoch duration: 0:00:51.529326\n",
+      "2023-04-07 02:13:00,792 - INFO - combo.training.trainer - Estimated training time remaining: 4:11:08\n",
+      "2023-04-07 02:13:00,792 - INFO - allennlp.training.trainer - Epoch 179/399\n",
+      "2023-04-07 02:13:00,793 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:13:00,793 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:13:00,803 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9487, UAS: 0.9741, LAS: 0.9447, UEM: 0.7545, LEM: 0.5154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2545, partial_loss/deprel_loss: 0.2657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4491, loss: 0.4412, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||:   5%|5         | 5/95 [00:02<00:38,  2.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9696, LAS: 0.9413, UEM: 0.6951, LEM: 0.4698, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4386, partial_loss/deprel_loss: 0.3273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5352, loss: 0.4716, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||:  11%|#         | 10/95 [00:04<00:36,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9708, LAS: 0.9427, UEM: 0.7186, LEM: 0.4994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1168, partial_loss/deprel_loss: 0.2143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3804, loss: 0.4632, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||:  15%|#4        | 14/95 [00:06<00:36,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9694, LAS: 0.9418, UEM: 0.6895, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2626, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5063, loss: 0.4716, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||:  20%|##        | 19/95 [00:08<00:33,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9676, LAS: 0.9401, UEM: 0.6739, LEM: 0.4672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4694, partial_loss/deprel_loss: 0.3503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5597, loss: 0.4829, batch_reg_loss: 0.1856, reg_loss: 0.1856 ||:  25%|##5       | 24/95 [00:10<00:30,  2.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9674, LAS: 0.9396, UEM: 0.6575, LEM: 0.4444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5876, partial_loss/deprel_loss: 0.4009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6238, loss: 0.4877, batch_reg_loss: 0.1855, reg_loss: 0.1856 ||:  32%|###1      | 30/95 [00:12<00:27,  2.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9478, UAS: 0.9671, LAS: 0.9394, UEM: 0.6786, LEM: 0.4724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1968, partial_loss/deprel_loss: 0.2692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4402, loss: 0.4889, batch_reg_loss: 0.1855, reg_loss: 0.1856 ||:  37%|###6      | 35/95 [00:15<00:26,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9684, LAS: 0.9407, UEM: 0.6999, LEM: 0.4939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1567, partial_loss/deprel_loss: 0.2432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4114, loss: 0.4793, batch_reg_loss: 0.1855, reg_loss: 0.1856 ||:  42%|####2     | 40/95 [00:17<00:24,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9685, LAS: 0.9408, UEM: 0.6923, LEM: 0.4840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2838, partial_loss/deprel_loss: 0.2799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4662, loss: 0.4792, batch_reg_loss: 0.1855, reg_loss: 0.1856 ||:  47%|####7     | 45/95 [00:19<00:21,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9688, LAS: 0.9413, UEM: 0.7222, LEM: 0.5253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.2620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4490, loss: 0.4761, batch_reg_loss: 0.1855, reg_loss: 0.1856 ||:  53%|#####2    | 50/95 [00:22<00:20,  2.18it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9684, LAS: 0.9411, UEM: 0.7157, LEM: 0.5196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1743, partial_loss/deprel_loss: 0.2036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3832, loss: 0.4767, batch_reg_loss: 0.1855, reg_loss: 0.1855 ||:  58%|#####7    | 55/95 [00:24<00:18,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9665, UAS: 0.9681, LAS: 0.9410, UEM: 0.7111, LEM: 0.5155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0689, partial_loss/deprel_loss: 0.1774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3412, loss: 0.4791, batch_reg_loss: 0.1854, reg_loss: 0.1855 ||:  63%|######3   | 60/95 [00:26<00:15,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9680, LAS: 0.9409, UEM: 0.7069, LEM: 0.5104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2347, partial_loss/deprel_loss: 0.2438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4274, loss: 0.4796, batch_reg_loss: 0.1854, reg_loss: 0.1855 ||:  68%|######8   | 65/95 [00:28<00:13,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9678, LAS: 0.9407, UEM: 0.7068, LEM: 0.5081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1226, partial_loss/deprel_loss: 0.2546, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4136, loss: 0.4802, batch_reg_loss: 0.1854, reg_loss: 0.1855 ||:  74%|#######3  | 70/95 [00:31<00:11,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9683, LAS: 0.9412, UEM: 0.7103, LEM: 0.5114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1969, partial_loss/deprel_loss: 0.2432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.4771, batch_reg_loss: 0.1854, reg_loss: 0.1855 ||:  79%|#######8  | 75/95 [00:33<00:08,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9518, UAS: 0.9686, LAS: 0.9413, UEM: 0.7199, LEM: 0.5234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1272, partial_loss/deprel_loss: 0.2134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3815, loss: 0.4750, batch_reg_loss: 0.1854, reg_loss: 0.1855 ||:  84%|########4 | 80/95 [00:35<00:06,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9682, LAS: 0.9409, UEM: 0.7135, LEM: 0.5157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2717, partial_loss/deprel_loss: 0.3277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5018, loss: 0.4787, batch_reg_loss: 0.1853, reg_loss: 0.1855 ||:  89%|########9 | 85/95 [00:38<00:04,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9479, UAS: 0.9685, LAS: 0.9411, UEM: 0.7142, LEM: 0.5132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1888, partial_loss/deprel_loss: 0.2510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4239, loss: 0.4767, batch_reg_loss: 0.1853, reg_loss: 0.1855 ||:  95%|#########4| 90/95 [00:40<00:02,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9589, UAS: 0.9684, LAS: 0.9411, UEM: 0.7093, LEM: 0.5086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1960, partial_loss/deprel_loss: 0.2169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3981, loss: 0.4780, batch_reg_loss: 0.1853, reg_loss: 0.1855 ||: 100%|##########| 95/95 [00:42<00:00,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9589, UAS: 0.9684, LAS: 0.9411, UEM: 0.7093, LEM: 0.5086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1960, partial_loss/deprel_loss: 0.2169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3981, loss: 0.4780, batch_reg_loss: 0.1853, reg_loss: 0.1855 ||: 100%|##########| 95/95 [00:42<00:00,  2.24it/s]\n",
+      "2023-04-07 02:13:46,147 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.185  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - UEM                      |     0.709  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - LEM                      |     0.509  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - EM                       |     0.959  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.196  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - UAS                      |     0.968  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.217  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - loss                     |     0.478  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - LAS                      |     0.941  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:13:46,148 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:13:46,149 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:13:46,149 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:13:46,149 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:13:46,153 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:13:50,367 - INFO - combo.training.trainer - Epoch duration: 0:00:49.574997\n",
+      "2023-04-07 02:13:50,368 - INFO - combo.training.trainer - Estimated training time remaining: 4:09:37\n",
+      "2023-04-07 02:13:50,368 - INFO - allennlp.training.trainer - Epoch 180/399\n",
+      "2023-04-07 02:13:50,368 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:13:50,368 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:13:50,376 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9666, LAS: 0.9383, UEM: 0.7143, LEM: 0.5138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5761, partial_loss/deprel_loss: 0.4226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6386, loss: 0.4976, batch_reg_loss: 0.1853, reg_loss: 0.1853 ||:   5%|5         | 5/95 [00:02<00:39,  2.31it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9528, UAS: 0.9725, LAS: 0.9441, UEM: 0.7695, LEM: 0.5583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1173, partial_loss/deprel_loss: 0.2469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4063, loss: 0.4607, batch_reg_loss: 0.1853, reg_loss: 0.1853 ||:  11%|#         | 10/95 [00:04<00:37,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9516, UAS: 0.9703, LAS: 0.9421, UEM: 0.7411, LEM: 0.5255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1205, partial_loss/deprel_loss: 0.2397, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4011, loss: 0.4728, batch_reg_loss: 0.1852, reg_loss: 0.1853 ||:  16%|#5        | 15/95 [00:06<00:35,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9272, UAS: 0.9678, LAS: 0.9398, UEM: 0.7004, LEM: 0.4850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5309, partial_loss/deprel_loss: 0.3997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6112, loss: 0.4891, batch_reg_loss: 0.1852, reg_loss: 0.1853 ||:  21%|##1       | 20/95 [00:08<00:33,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9581, UAS: 0.9695, LAS: 0.9411, UEM: 0.7254, LEM: 0.5143, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0978, partial_loss/deprel_loss: 0.1723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3426, loss: 0.4737, batch_reg_loss: 0.1852, reg_loss: 0.1853 ||:  26%|##6       | 25/95 [00:11<00:31,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9740, UAS: 0.9715, LAS: 0.9437, UEM: 0.7774, LEM: 0.5921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0434, partial_loss/deprel_loss: 0.1056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2784, loss: 0.4567, batch_reg_loss: 0.1852, reg_loss: 0.1852 ||:  32%|###1      | 30/95 [00:14<00:31,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9523, UAS: 0.9717, LAS: 0.9443, UEM: 0.7673, LEM: 0.5787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2146, partial_loss/deprel_loss: 0.2549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4320, loss: 0.4575, batch_reg_loss: 0.1852, reg_loss: 0.1852 ||:  37%|###6      | 35/95 [00:16<00:28,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9710, LAS: 0.9432, UEM: 0.7501, LEM: 0.5583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4043, partial_loss/deprel_loss: 0.3704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5624, loss: 0.4664, batch_reg_loss: 0.1851, reg_loss: 0.1852 ||:  42%|####2     | 40/95 [00:18<00:25,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9704, LAS: 0.9424, UEM: 0.7416, LEM: 0.5446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1745, partial_loss/deprel_loss: 0.2983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4587, loss: 0.4725, batch_reg_loss: 0.1851, reg_loss: 0.1852 ||:  47%|####7     | 45/95 [00:20<00:22,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9569, UAS: 0.9699, LAS: 0.9418, UEM: 0.7404, LEM: 0.5427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1420, partial_loss/deprel_loss: 0.2244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3930, loss: 0.4751, batch_reg_loss: 0.1851, reg_loss: 0.1852 ||:  53%|#####2    | 50/95 [00:22<00:20,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9608, UAS: 0.9702, LAS: 0.9422, UEM: 0.7406, LEM: 0.5428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0560, partial_loss/deprel_loss: 0.1966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3536, loss: 0.4727, batch_reg_loss: 0.1851, reg_loss: 0.1852 ||:  58%|#####7    | 55/95 [00:25<00:18,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8971, UAS: 0.9693, LAS: 0.9415, UEM: 0.7310, LEM: 0.5324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8916, partial_loss/deprel_loss: 0.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6847, loss: 0.4766, batch_reg_loss: 0.1851, reg_loss: 0.1852 ||:  63%|######3   | 60/95 [00:27<00:16,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9568, UAS: 0.9695, LAS: 0.9418, UEM: 0.7304, LEM: 0.5310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1583, partial_loss/deprel_loss: 0.1793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3601, loss: 0.4742, batch_reg_loss: 0.1851, reg_loss: 0.1852 ||:  68%|######8   | 65/95 [00:29<00:13,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9691, LAS: 0.9413, UEM: 0.7234, LEM: 0.5233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8747, partial_loss/deprel_loss: 0.4824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7459, loss: 0.4777, batch_reg_loss: 0.1850, reg_loss: 0.1852 ||:  74%|#######3  | 70/95 [00:32<00:11,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9691, LAS: 0.9412, UEM: 0.7214, LEM: 0.5210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3175, partial_loss/deprel_loss: 0.3895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5601, loss: 0.4768, batch_reg_loss: 0.1850, reg_loss: 0.1852 ||:  79%|#######8  | 75/95 [00:34<00:09,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9689, LAS: 0.9411, UEM: 0.7181, LEM: 0.5174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3564, partial_loss/deprel_loss: 0.2989, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4954, loss: 0.4772, batch_reg_loss: 0.1850, reg_loss: 0.1852 ||:  84%|########4 | 80/95 [00:36<00:06,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9688, LAS: 0.9411, UEM: 0.7141, LEM: 0.5136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2639, partial_loss/deprel_loss: 0.2869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4673, loss: 0.4762, batch_reg_loss: 0.1850, reg_loss: 0.1851 ||:  89%|########9 | 85/95 [00:38<00:04,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9688, LAS: 0.9411, UEM: 0.7095, LEM: 0.5080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3271, partial_loss/deprel_loss: 0.3225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5084, loss: 0.4765, batch_reg_loss: 0.1850, reg_loss: 0.1851 ||:  95%|#########4| 90/95 [00:41<00:02,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9687, LAS: 0.9410, UEM: 0.7068, LEM: 0.5043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1697, partial_loss/deprel_loss: 0.2672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4326, loss: 0.4761, batch_reg_loss: 0.1850, reg_loss: 0.1851 ||: 100%|##########| 95/95 [00:43<00:00,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9687, LAS: 0.9410, UEM: 0.7068, LEM: 0.5043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1697, partial_loss/deprel_loss: 0.2672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4326, loss: 0.4761, batch_reg_loss: 0.1850, reg_loss: 0.1851 ||: 100%|##########| 95/95 [00:43<00:00,  2.19it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:14:37,037 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8546, UAS: 0.9535, LAS: 0.9074, UEM: 0.7970, LEM: 0.5912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5753, partial_loss/deprel_loss: 16.2328, partial_loss/cycle_loss: 0.0000, batch_loss: 13.3013, loss: 7.2497, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:05,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8725, UAS: 0.9544, LAS: 0.9038, UEM: 0.7405, LEM: 0.4788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0724, partial_loss/deprel_loss: 12.5631, partial_loss/cycle_loss: 0.0000, batch_loss: 10.2649, loss: 7.0178, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:04<00:02,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8985, UAS: 0.9519, LAS: 0.9015, UEM: 0.6893, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6453, partial_loss/deprel_loss: 6.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2296, loss: 7.0737, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00,  1.54it/s] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8985, UAS: 0.9519, LAS: 0.9015, UEM: 0.6893, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6453, partial_loss/deprel_loss: 6.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2296, loss: 7.0737, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00,  1.57it/s]\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.185  |     0.000\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - UEM                      |     0.707  |     0.689\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - LEM                      |     0.504  |     0.416\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - EM                       |     0.945  |     0.899\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.170  |     0.645\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - UAS                      |     0.969  |     0.952\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.267  |     6.376\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - loss                     |     0.476  |     7.074\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:14:44,051 - INFO - combo.training.tensorboard_writer - LAS                      |     0.941  |     0.902\n",
+      "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:14:44,052 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 02:14:44,056 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:14:48,239 - INFO - combo.training.trainer - Epoch duration: 0:00:57.871390\n",
+      "2023-04-07 02:14:48,240 - INFO - combo.training.trainer - Estimated training time remaining: 4:08:16\n",
+      "2023-04-07 02:14:48,240 - INFO - allennlp.training.trainer - Epoch 181/399\n",
+      "2023-04-07 02:14:48,240 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:14:48,241 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:14:48,251 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9632, UAS: 0.9710, LAS: 0.9417, UEM: 0.7680, LEM: 0.5770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0552, partial_loss/deprel_loss: 0.1685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3308, loss: 0.4788, batch_reg_loss: 0.1849, reg_loss: 0.1849 ||:   5%|5         | 5/95 [00:02<00:41,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9557, UAS: 0.9717, LAS: 0.9426, UEM: 0.7406, LEM: 0.5353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1134, partial_loss/deprel_loss: 0.1824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3535, loss: 0.4690, batch_reg_loss: 0.1849, reg_loss: 0.1849 ||:  11%|#         | 10/95 [00:04<00:39,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9515, UAS: 0.9691, LAS: 0.9408, UEM: 0.7014, LEM: 0.4932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2414, partial_loss/deprel_loss: 0.2581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4397, loss: 0.4805, batch_reg_loss: 0.1849, reg_loss: 0.1849 ||:  16%|#5        | 15/95 [00:06<00:36,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9685, LAS: 0.9408, UEM: 0.6720, LEM: 0.4638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2285, partial_loss/deprel_loss: 0.2683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4452, loss: 0.4799, batch_reg_loss: 0.1849, reg_loss: 0.1849 ||:  21%|##1       | 20/95 [00:08<00:33,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9681, LAS: 0.9399, UEM: 0.6728, LEM: 0.4593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1980, partial_loss/deprel_loss: 0.2204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4008, loss: 0.4819, batch_reg_loss: 0.1849, reg_loss: 0.1849 ||:  26%|##6       | 25/95 [00:11<00:31,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9443, UAS: 0.9664, LAS: 0.9386, UEM: 0.6539, LEM: 0.4442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2628, partial_loss/deprel_loss: 0.2362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4264, loss: 0.4863, batch_reg_loss: 0.1849, reg_loss: 0.1849 ||:  32%|###1      | 30/95 [00:13<00:29,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9535, UAS: 0.9670, LAS: 0.9395, UEM: 0.6755, LEM: 0.4746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2242, partial_loss/deprel_loss: 0.2373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4195, loss: 0.4807, batch_reg_loss: 0.1848, reg_loss: 0.1849 ||:  37%|###6      | 35/95 [00:15<00:26,  2.26it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9515, UAS: 0.9672, LAS: 0.9397, UEM: 0.6724, LEM: 0.4718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1763, partial_loss/deprel_loss: 0.2509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4208, loss: 0.4792, batch_reg_loss: 0.1848, reg_loss: 0.1849 ||:  42%|####2     | 40/95 [00:17<00:24,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9681, LAS: 0.9407, UEM: 0.6855, LEM: 0.4840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1212, partial_loss/deprel_loss: 0.2362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3980, loss: 0.4717, batch_reg_loss: 0.1848, reg_loss: 0.1849 ||:  47%|####7     | 45/95 [00:19<00:21,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9687, LAS: 0.9412, UEM: 0.6877, LEM: 0.4805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1818, partial_loss/deprel_loss: 0.2404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4134, loss: 0.4700, batch_reg_loss: 0.1848, reg_loss: 0.1849 ||:  53%|#####2    | 50/95 [00:22<00:19,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9687, LAS: 0.9412, UEM: 0.6919, LEM: 0.4843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1079, partial_loss/deprel_loss: 0.2376, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3965, loss: 0.4705, batch_reg_loss: 0.1848, reg_loss: 0.1849 ||:  58%|#####7    | 55/95 [00:24<00:17,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9680, LAS: 0.9404, UEM: 0.7010, LEM: 0.4956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8331, partial_loss/deprel_loss: 0.4301, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6954, loss: 0.4739, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||:  63%|######3   | 60/95 [00:27<00:16,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9684, LAS: 0.9407, UEM: 0.7038, LEM: 0.4976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5620, partial_loss/deprel_loss: 0.4448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.4739, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||:  68%|######8   | 65/95 [00:29<00:13,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9683, LAS: 0.9406, UEM: 0.7031, LEM: 0.4978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4556, partial_loss/deprel_loss: 0.3402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5480, loss: 0.4741, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||:  74%|#######3  | 70/95 [00:31<00:11,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9689, LAS: 0.9411, UEM: 0.7104, LEM: 0.5046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1098, partial_loss/deprel_loss: 0.2107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3752, loss: 0.4713, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||:  79%|#######8  | 75/95 [00:33<00:09,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9691, LAS: 0.9414, UEM: 0.7085, LEM: 0.5024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2873, partial_loss/deprel_loss: 0.2373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4320, loss: 0.4695, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||:  84%|########4 | 80/95 [00:35<00:06,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9592, UAS: 0.9689, LAS: 0.9411, UEM: 0.7038, LEM: 0.4966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1614, partial_loss/deprel_loss: 0.2006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3774, loss: 0.4733, batch_reg_loss: 0.1847, reg_loss: 0.1848 ||:  89%|########9 | 85/95 [00:38<00:04,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9686, LAS: 0.9409, UEM: 0.7077, LEM: 0.5081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4128, partial_loss/deprel_loss: 0.3691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5624, loss: 0.4748, batch_reg_loss: 0.1846, reg_loss: 0.1848 ||:  95%|#########4| 90/95 [00:40<00:02,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9686, LAS: 0.9408, UEM: 0.7062, LEM: 0.5043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.3166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4950, loss: 0.4757, batch_reg_loss: 0.1846, reg_loss: 0.1848 ||: 100%|##########| 95/95 [00:42<00:00,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9686, LAS: 0.9408, UEM: 0.7062, LEM: 0.5043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.3166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4950, loss: 0.4757, batch_reg_loss: 0.1846, reg_loss: 0.1848 ||: 100%|##########| 95/95 [00:42<00:00,  2.22it/s]\n",
+      "2023-04-07 02:15:34,180 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:15:34,180 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 02:15:34,180 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.185  |       N/A\n",
+      "2023-04-07 02:15:34,180 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - UEM                      |     0.706  |       N/A\n",
+      "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - LEM                      |     0.504  |       N/A\n",
+      "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - EM                       |     0.935  |       N/A\n",
+      "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.286  |       N/A\n",
+      "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:15:34,181 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - UAS                      |     0.969  |       N/A\n",
+      "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.317  |       N/A\n",
+      "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - loss                     |     0.476  |       N/A\n",
+      "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - LAS                      |     0.941  |       N/A\n",
+      "2023-04-07 02:15:34,182 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:15:34,183 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:15:34,183 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:15:34,183 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:15:34,183 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:15:34,183 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:15:34,195 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:15:38,586 - INFO - combo.training.trainer - Epoch duration: 0:00:50.345983\n",
+      "2023-04-07 02:15:38,586 - INFO - combo.training.trainer - Estimated training time remaining: 4:06:47\n",
+      "2023-04-07 02:15:38,587 - INFO - allennlp.training.trainer - Epoch 182/399\n",
+      "2023-04-07 02:15:38,587 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:15:38,587 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:15:38,594 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9589, LAS: 0.9323, UEM: 0.4513, LEM: 0.2445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8072, partial_loss/deprel_loss: 0.4965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7432, loss: 0.5557, batch_reg_loss: 0.1846, reg_loss: 0.1846 ||:   5%|5         | 5/95 [00:02<00:37,  2.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9688, UAS: 0.9632, LAS: 0.9373, UEM: 0.6926, LEM: 0.5358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0722, partial_loss/deprel_loss: 0.1310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3038, loss: 0.5093, batch_reg_loss: 0.1846, reg_loss: 0.1846 ||:  11%|#         | 10/95 [00:04<00:36,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9643, LAS: 0.9378, UEM: 0.6684, LEM: 0.5039, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3727, partial_loss/deprel_loss: 0.3393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5306, loss: 0.5034, batch_reg_loss: 0.1846, reg_loss: 0.1846 ||:  16%|#5        | 15/95 [00:06<00:34,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9479, UAS: 0.9642, LAS: 0.9372, UEM: 0.6723, LEM: 0.4964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2291, partial_loss/deprel_loss: 0.2518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4318, loss: 0.5044, batch_reg_loss: 0.1846, reg_loss: 0.1846 ||:  21%|##1       | 20/95 [00:08<00:32,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9576, UAS: 0.9656, LAS: 0.9386, UEM: 0.6941, LEM: 0.5172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0670, partial_loss/deprel_loss: 0.2053, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3622, loss: 0.4949, batch_reg_loss: 0.1845, reg_loss: 0.1846 ||:  26%|##6       | 25/95 [00:10<00:30,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9569, UAS: 0.9667, LAS: 0.9399, UEM: 0.6898, LEM: 0.5080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2092, partial_loss/deprel_loss: 0.2409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4191, loss: 0.4878, batch_reg_loss: 0.1845, reg_loss: 0.1846 ||:  32%|###1      | 30/95 [00:12<00:27,  2.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9673, LAS: 0.9401, UEM: 0.6961, LEM: 0.5105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4122, partial_loss/deprel_loss: 0.3134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5177, loss: 0.4844, batch_reg_loss: 0.1845, reg_loss: 0.1846 ||:  37%|###6      | 35/95 [00:15<00:25,  2.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9663, LAS: 0.9393, UEM: 0.6766, LEM: 0.4891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3957, partial_loss/deprel_loss: 0.3226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5217, loss: 0.4897, batch_reg_loss: 0.1845, reg_loss: 0.1846 ||:  42%|####2     | 40/95 [00:17<00:23,  2.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9662, LAS: 0.9391, UEM: 0.6756, LEM: 0.4869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4823, partial_loss/deprel_loss: 0.3495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5606, loss: 0.4917, batch_reg_loss: 0.1845, reg_loss: 0.1845 ||:  47%|####7     | 45/95 [00:19<00:21,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9676, LAS: 0.9406, UEM: 0.6992, LEM: 0.5072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1197, partial_loss/deprel_loss: 0.2593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4158, loss: 0.4832, batch_reg_loss: 0.1845, reg_loss: 0.1845 ||:  53%|#####2    | 50/95 [00:21<00:20,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9677, LAS: 0.9404, UEM: 0.6934, LEM: 0.4971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4337, partial_loss/deprel_loss: 0.3512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5522, loss: 0.4848, batch_reg_loss: 0.1844, reg_loss: 0.1845 ||:  58%|#####7    | 55/95 [00:23<00:17,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9682, LAS: 0.9411, UEM: 0.6925, LEM: 0.4947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2274, partial_loss/deprel_loss: 0.2473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4278, loss: 0.4807, batch_reg_loss: 0.1844, reg_loss: 0.1845 ||:  63%|######3   | 60/95 [00:26<00:15,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9522, UAS: 0.9685, LAS: 0.9413, UEM: 0.6904, LEM: 0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2265, partial_loss/deprel_loss: 0.2075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3957, loss: 0.4787, batch_reg_loss: 0.1844, reg_loss: 0.1845 ||:  68%|######8   | 65/95 [00:28<00:12,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9687, LAS: 0.9414, UEM: 0.6932, LEM: 0.4907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1359, partial_loss/deprel_loss: 0.2819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4371, loss: 0.4779, batch_reg_loss: 0.1844, reg_loss: 0.1845 ||:  74%|#######3  | 70/95 [00:30<00:11,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9692, LAS: 0.9419, UEM: 0.6971, LEM: 0.4931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2576, partial_loss/deprel_loss: 0.2595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4435, loss: 0.4745, batch_reg_loss: 0.1844, reg_loss: 0.1845 ||:  79%|#######8  | 75/95 [00:32<00:09,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9688, LAS: 0.9415, UEM: 0.6922, LEM: 0.4883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5407, partial_loss/deprel_loss: 0.3514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5736, loss: 0.4771, batch_reg_loss: 0.1843, reg_loss: 0.1845 ||:  84%|########4 | 80/95 [00:37<00:08,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9689, LAS: 0.9418, UEM: 0.7071, LEM: 0.5115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5852, partial_loss/deprel_loss: 0.3974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6193, loss: 0.4749, batch_reg_loss: 0.1843, reg_loss: 0.1845 ||:  88%|########8 | 84/95 [00:39<00:06,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9691, LAS: 0.9419, UEM: 0.7056, LEM: 0.5088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3327, partial_loss/deprel_loss: 0.3603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5391, loss: 0.4745, batch_reg_loss: 0.1843, reg_loss: 0.1845 ||:  94%|#########3| 89/95 [00:41<00:03,  1.90it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9461, UAS: 0.9693, LAS: 0.9421, UEM: 0.7087, LEM: 0.5115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2439, partial_loss/deprel_loss: 0.2633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.4740, batch_reg_loss: 0.1843, reg_loss: 0.1845 ||:  99%|#########8| 94/95 [00:44<00:00,  1.97it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9694, LAS: 0.9422, UEM: 0.7084, LEM: 0.5104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1739, partial_loss/deprel_loss: 0.2740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4383, loss: 0.4736, batch_reg_loss: 0.1843, reg_loss: 0.1845 ||: 100%|##########| 95/95 [00:44<00:00,  2.14it/s]\n",
+      "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.184  |       N/A\n",
+      "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - UEM                      |     0.708  |       N/A\n",
+      "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - LEM                      |     0.510  |       N/A\n",
+      "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - EM                       |     0.948  |       N/A\n",
+      "2023-04-07 02:16:25,865 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.174  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - UAS                      |     0.969  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.274  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - loss                     |     0.474  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - LAS                      |     0.942  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:16:25,866 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:16:25,870 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:16:29,983 - INFO - combo.training.trainer - Epoch duration: 0:00:51.396437\n",
+      "2023-04-07 02:16:29,983 - INFO - combo.training.trainer - Estimated training time remaining: 4:05:20\n",
+      "2023-04-07 02:16:29,984 - INFO - allennlp.training.trainer - Epoch 183/399\n",
+      "2023-04-07 02:16:29,984 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:16:29,984 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:16:29,992 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9736, LAS: 0.9450, UEM: 0.7081, LEM: 0.4617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.2291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3990, loss: 0.4526, batch_reg_loss: 0.1843, reg_loss: 0.1843 ||:   5%|5         | 5/95 [00:02<00:38,  2.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9648, LAS: 0.9359, UEM: 0.6100, LEM: 0.3716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3126, partial_loss/deprel_loss: 0.3098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4946, loss: 0.5070, batch_reg_loss: 0.1843, reg_loss: 0.1843 ||:  11%|#         | 10/95 [00:04<00:36,  2.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9680, LAS: 0.9394, UEM: 0.6750, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1583, partial_loss/deprel_loss: 0.2077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3821, loss: 0.4776, batch_reg_loss: 0.1842, reg_loss: 0.1843 ||:  16%|#5        | 15/95 [00:06<00:34,  2.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9706, LAS: 0.9418, UEM: 0.7283, LEM: 0.5052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2150, partial_loss/deprel_loss: 0.2509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4279, loss: 0.4616, batch_reg_loss: 0.1842, reg_loss: 0.1843 ||:  21%|##1       | 20/95 [00:08<00:32,  2.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9682, LAS: 0.9397, UEM: 0.6953, LEM: 0.4727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3700, partial_loss/deprel_loss: 0.3394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5297, loss: 0.4773, batch_reg_loss: 0.1842, reg_loss: 0.1842 ||:  26%|##6       | 25/95 [00:10<00:30,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9593, UAS: 0.9699, LAS: 0.9416, UEM: 0.7165, LEM: 0.4932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0679, partial_loss/deprel_loss: 0.1659, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3305, loss: 0.4651, batch_reg_loss: 0.1842, reg_loss: 0.1842 ||:  32%|###1      | 30/95 [00:13<00:28,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9489, UAS: 0.9707, LAS: 0.9429, UEM: 0.7351, LEM: 0.5240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2346, partial_loss/deprel_loss: 0.2264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4122, loss: 0.4562, batch_reg_loss: 0.1842, reg_loss: 0.1842 ||:  37%|###6      | 35/95 [00:15<00:26,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9701, LAS: 0.9425, UEM: 0.7245, LEM: 0.5128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2820, partial_loss/deprel_loss: 0.2577, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4467, loss: 0.4615, batch_reg_loss: 0.1841, reg_loss: 0.1842 ||:  42%|####2     | 40/95 [00:17<00:24,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9443, UAS: 0.9694, LAS: 0.9419, UEM: 0.7106, LEM: 0.4996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2296, partial_loss/deprel_loss: 0.2727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4482, loss: 0.4674, batch_reg_loss: 0.1841, reg_loss: 0.1842 ||:  47%|####7     | 45/95 [00:19<00:21,  2.27it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9498, UAS: 0.9702, LAS: 0.9424, UEM: 0.7154, LEM: 0.5002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1348, partial_loss/deprel_loss: 0.2371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4008, loss: 0.4638, batch_reg_loss: 0.1841, reg_loss: 0.1842 ||:  53%|#####2    | 50/95 [00:21<00:19,  2.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9709, LAS: 0.9432, UEM: 0.7288, LEM: 0.5171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1072, partial_loss/deprel_loss: 0.2281, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3880, loss: 0.4582, batch_reg_loss: 0.1841, reg_loss: 0.1842 ||:  58%|#####7    | 55/95 [00:24<00:17,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9709, LAS: 0.9432, UEM: 0.7273, LEM: 0.5154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5454, partial_loss/deprel_loss: 0.3674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5870, loss: 0.4585, batch_reg_loss: 0.1841, reg_loss: 0.1842 ||:  63%|######3   | 60/95 [00:26<00:16,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9709, LAS: 0.9431, UEM: 0.7266, LEM: 0.5144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0981, partial_loss/deprel_loss: 0.2148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3755, loss: 0.4597, batch_reg_loss: 0.1840, reg_loss: 0.1842 ||:  68%|######8   | 65/95 [00:28<00:13,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9707, LAS: 0.9428, UEM: 0.7228, LEM: 0.5096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3294, partial_loss/deprel_loss: 0.2967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4872, loss: 0.4622, batch_reg_loss: 0.1840, reg_loss: 0.1842 ||:  74%|#######3  | 70/95 [00:31<00:11,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9700, LAS: 0.9423, UEM: 0.7160, LEM: 0.5036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1628, partial_loss/deprel_loss: 0.2177, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3907, loss: 0.4662, batch_reg_loss: 0.1840, reg_loss: 0.1841 ||:  79%|#######8  | 75/95 [00:33<00:09,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9697, LAS: 0.9418, UEM: 0.7115, LEM: 0.4986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3087, partial_loss/deprel_loss: 0.3319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5112, loss: 0.4701, batch_reg_loss: 0.1840, reg_loss: 0.1841 ||:  84%|########4 | 80/95 [00:35<00:06,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9515, UAS: 0.9701, LAS: 0.9424, UEM: 0.7249, LEM: 0.5196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1842, partial_loss/deprel_loss: 0.2391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4120, loss: 0.4662, batch_reg_loss: 0.1840, reg_loss: 0.1841 ||:  89%|########9 | 85/95 [00:38<00:04,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9698, LAS: 0.9421, UEM: 0.7194, LEM: 0.5130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3806, partial_loss/deprel_loss: 0.3290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5233, loss: 0.4687, batch_reg_loss: 0.1839, reg_loss: 0.1841 ||:  95%|#########4| 90/95 [00:40<00:02,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9691, LAS: 0.9415, UEM: 0.7092, LEM: 0.5038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4928, partial_loss/deprel_loss: 0.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5814, loss: 0.4741, batch_reg_loss: 0.1839, reg_loss: 0.1841 ||: 100%|##########| 95/95 [00:42<00:00,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9691, LAS: 0.9415, UEM: 0.7092, LEM: 0.5038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4928, partial_loss/deprel_loss: 0.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5814, loss: 0.4741, batch_reg_loss: 0.1839, reg_loss: 0.1841 ||: 100%|##########| 95/95 [00:42<00:00,  2.23it/s]\n",
+      "2023-04-07 02:17:15,937 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:17:15,937 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 02:17:15,937 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.184  |       N/A\n",
+      "2023-04-07 02:17:15,937 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - UEM                      |     0.709  |       N/A\n",
+      "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - LEM                      |     0.504  |       N/A\n",
+      "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - EM                       |     0.926  |       N/A\n",
+      "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.493  |       N/A\n",
+      "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:17:15,938 - INFO - combo.training.tensorboard_writer - UAS                      |     0.969  |       N/A\n",
+      "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.374  |       N/A\n",
+      "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - loss                     |     0.474  |       N/A\n",
+      "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - LAS                      |     0.941  |       N/A\n",
+      "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:17:15,939 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:17:15,940 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:17:15,940 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:17:15,940 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:17:15,940 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:17:15,949 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:17:19,499 - INFO - combo.training.trainer - Epoch duration: 0:00:49.514962\n",
+      "2023-04-07 02:17:19,499 - INFO - combo.training.trainer - Estimated training time remaining: 4:03:50\n",
+      "2023-04-07 02:17:19,499 - INFO - allennlp.training.trainer - Epoch 184/399\n",
+      "2023-04-07 02:17:19,500 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:17:19,501 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:17:19,510 - INFO - allennlp.training.trainer - Training\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9601, UAS: 0.9756, LAS: 0.9476, UEM: 0.7727, LEM: 0.5719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0784, partial_loss/deprel_loss: 0.1610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3284, loss: 0.4333, batch_reg_loss: 0.1839, reg_loss: 0.1839 ||:   5%|5         | 5/95 [00:02<00:37,  2.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9517, UAS: 0.9734, LAS: 0.9460, UEM: 0.7501, LEM: 0.5449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1814, partial_loss/deprel_loss: 0.2370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4097, loss: 0.4404, batch_reg_loss: 0.1839, reg_loss: 0.1839 ||:  11%|#         | 10/95 [00:04<00:36,  2.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9707, LAS: 0.9428, UEM: 0.7047, LEM: 0.4890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6634, partial_loss/deprel_loss: 0.4062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6415, loss: 0.4590, batch_reg_loss: 0.1839, reg_loss: 0.1839 ||:  16%|#5        | 15/95 [00:06<00:33,  2.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9683, LAS: 0.9406, UEM: 0.6697, LEM: 0.4599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3319, partial_loss/deprel_loss: 0.4034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.4729, batch_reg_loss: 0.1839, reg_loss: 0.1839 ||:  21%|##1       | 20/95 [00:08<00:31,  2.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9671, LAS: 0.9396, UEM: 0.6771, LEM: 0.4706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9460, partial_loss/deprel_loss: 0.4293, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7165, loss: 0.4751, batch_reg_loss: 0.1838, reg_loss: 0.1839 ||:  26%|##6       | 25/95 [00:10<00:30,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9554, UAS: 0.9685, LAS: 0.9412, UEM: 0.6890, LEM: 0.4775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1203, partial_loss/deprel_loss: 0.2240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3871, loss: 0.4683, batch_reg_loss: 0.1838, reg_loss: 0.1839 ||:  33%|###2      | 31/95 [00:13<00:26,  2.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9686, LAS: 0.9412, UEM: 0.6822, LEM: 0.4679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1838, partial_loss/deprel_loss: 0.2343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4080, loss: 0.4687, batch_reg_loss: 0.1838, reg_loss: 0.1839 ||:  39%|###8      | 37/95 [00:15<00:23,  2.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9128, UAS: 0.9682, LAS: 0.9413, UEM: 0.7009, LEM: 0.5026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6546, partial_loss/deprel_loss: 0.4432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6693, loss: 0.4710, batch_reg_loss: 0.1838, reg_loss: 0.1839 ||:  44%|####4     | 42/95 [00:17<00:23,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9629, UAS: 0.9691, LAS: 0.9420, UEM: 0.7133, LEM: 0.5150, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0854, partial_loss/deprel_loss: 0.1738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3399, loss: 0.4655, batch_reg_loss: 0.1838, reg_loss: 0.1838 ||:  49%|####9     | 47/95 [00:19<00:20,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9689, LAS: 0.9421, UEM: 0.7040, LEM: 0.5064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3287, partial_loss/deprel_loss: 0.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4696, loss: 0.4667, batch_reg_loss: 0.1838, reg_loss: 0.1838 ||:  55%|#####4    | 52/95 [00:22<00:18,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9395, UAS: 0.9690, LAS: 0.9420, UEM: 0.6976, LEM: 0.4968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3717, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5136, loss: 0.4681, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||:  60%|######    | 57/95 [00:24<00:16,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9686, LAS: 0.9416, UEM: 0.6937, LEM: 0.4938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2831, partial_loss/deprel_loss: 0.2799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4643, loss: 0.4708, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||:  65%|######5   | 62/95 [00:26<00:14,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9693, LAS: 0.9423, UEM: 0.7034, LEM: 0.5028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3190, partial_loss/deprel_loss: 0.2927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4817, loss: 0.4677, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||:  71%|#######   | 67/95 [00:29<00:12,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9694, LAS: 0.9424, UEM: 0.7031, LEM: 0.5013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1532, partial_loss/deprel_loss: 0.2547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4181, loss: 0.4677, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||:  76%|#######5  | 72/95 [00:31<00:10,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9687, LAS: 0.9417, UEM: 0.6940, LEM: 0.4925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8632, partial_loss/deprel_loss: 0.4697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7321, loss: 0.4724, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||:  81%|########1 | 77/95 [00:33<00:08,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9691, LAS: 0.9420, UEM: 0.7061, LEM: 0.5077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5038, partial_loss/deprel_loss: 0.3411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5573, loss: 0.4695, batch_reg_loss: 0.1837, reg_loss: 0.1838 ||:  86%|########6 | 82/95 [00:36<00:06,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9689, LAS: 0.9418, UEM: 0.7023, LEM: 0.5026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1276, partial_loss/deprel_loss: 0.2435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4039, loss: 0.4710, batch_reg_loss: 0.1836, reg_loss: 0.1838 ||:  92%|#########1| 87/95 [00:38<00:03,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9694, LAS: 0.9423, UEM: 0.7084, LEM: 0.5077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2658, partial_loss/deprel_loss: 0.3261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4977, loss: 0.4680, batch_reg_loss: 0.1836, reg_loss: 0.1838 ||:  97%|#########6| 92/95 [00:40<00:01,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9697, LAS: 0.9425, UEM: 0.7121, LEM: 0.5115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1267, partial_loss/deprel_loss: 0.2219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3864, loss: 0.4661, batch_reg_loss: 0.1836, reg_loss: 0.1838 ||: 100%|##########| 95/95 [00:41<00:00,  2.26it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:18:04,351 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.184  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - UEM                      |     0.712  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - LEM                      |     0.511  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - EM                       |     0.954  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.127  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - UAS                      |     0.970  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.222  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - loss                     |     0.466  |       N/A\n",
+      "2023-04-07 02:18:04,352 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - LAS                      |     0.943  |       N/A\n",
+      "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:18:04,353 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:18:04,358 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:18:08,062 - INFO - combo.training.trainer - Epoch duration: 0:00:48.562741\n",
+      "2023-04-07 02:18:08,062 - INFO - combo.training.trainer - Estimated training time remaining: 4:02:20\n",
+      "2023-04-07 02:18:08,063 - INFO - allennlp.training.trainer - Epoch 185/399\n",
+      "2023-04-07 02:18:08,063 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:18:08,063 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:18:08,077 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9713, LAS: 0.9422, UEM: 0.6968, LEM: 0.4471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1323, partial_loss/deprel_loss: 0.2587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4170, loss: 0.4686, batch_reg_loss: 0.1836, reg_loss: 0.1836 ||:   5%|5         | 5/95 [00:02<00:36,  2.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9733, LAS: 0.9454, UEM: 0.7769, LEM: 0.5865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4205, partial_loss/deprel_loss: 0.3167, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5210, loss: 0.4507, batch_reg_loss: 0.1836, reg_loss: 0.1836 ||:  11%|#         | 10/95 [00:04<00:35,  2.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9494, UAS: 0.9697, LAS: 0.9426, UEM: 0.7214, LEM: 0.5266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1653, partial_loss/deprel_loss: 0.2448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4124, loss: 0.4648, batch_reg_loss: 0.1836, reg_loss: 0.1836 ||:  16%|#5        | 15/95 [00:06<00:34,  2.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9487, UAS: 0.9696, LAS: 0.9425, UEM: 0.7060, LEM: 0.5067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2376, partial_loss/deprel_loss: 0.2455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4275, loss: 0.4680, batch_reg_loss: 0.1835, reg_loss: 0.1836 ||:  22%|##2       | 21/95 [00:08<00:30,  2.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9292, UAS: 0.9693, LAS: 0.9420, UEM: 0.6909, LEM: 0.4848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5075, partial_loss/deprel_loss: 0.3210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5418, loss: 0.4694, batch_reg_loss: 0.1835, reg_loss: 0.1836 ||:  27%|##7       | 26/95 [00:10<00:28,  2.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9561, UAS: 0.9686, LAS: 0.9415, UEM: 0.6786, LEM: 0.4748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1308, partial_loss/deprel_loss: 0.2191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3850, loss: 0.4728, batch_reg_loss: 0.1835, reg_loss: 0.1836 ||:  33%|###2      | 31/95 [00:12<00:26,  2.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9565, UAS: 0.9707, LAS: 0.9434, UEM: 0.7275, LEM: 0.5268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0810, partial_loss/deprel_loss: 0.1937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3547, loss: 0.4578, batch_reg_loss: 0.1835, reg_loss: 0.1835 ||:  38%|###7      | 36/95 [00:15<00:25,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9684, LAS: 0.9412, UEM: 0.7247, LEM: 0.5329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3536, partial_loss/deprel_loss: 0.3145, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5058, loss: 0.4714, batch_reg_loss: 0.1835, reg_loss: 0.1835 ||:  43%|####3     | 41/95 [00:18<00:24,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9360, UAS: 0.9692, LAS: 0.9418, UEM: 0.7286, LEM: 0.5308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3186, partial_loss/deprel_loss: 0.3249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5071, loss: 0.4669, batch_reg_loss: 0.1835, reg_loss: 0.1835 ||:  48%|####8     | 46/95 [00:20<00:22,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9518, UAS: 0.9696, LAS: 0.9421, UEM: 0.7231, LEM: 0.5219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2115, partial_loss/deprel_loss: 0.2225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4037, loss: 0.4641, batch_reg_loss: 0.1834, reg_loss: 0.1835 ||:  54%|#####3    | 51/95 [00:22<00:19,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9703, LAS: 0.9427, UEM: 0.7311, LEM: 0.5269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1679, partial_loss/deprel_loss: 0.2765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4382, loss: 0.4599, batch_reg_loss: 0.1834, reg_loss: 0.1835 ||:  59%|#####8    | 56/95 [00:24<00:17,  2.21it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9704, LAS: 0.9428, UEM: 0.7298, LEM: 0.5254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2747, partial_loss/deprel_loss: 0.3156, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4908, loss: 0.4607, batch_reg_loss: 0.1834, reg_loss: 0.1835 ||:  64%|######4   | 61/95 [00:27<00:15,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9706, LAS: 0.9430, UEM: 0.7294, LEM: 0.5232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1501, partial_loss/deprel_loss: 0.2593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4208, loss: 0.4599, batch_reg_loss: 0.1834, reg_loss: 0.1835 ||:  69%|######9   | 66/95 [00:29<00:13,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9536, UAS: 0.9701, LAS: 0.9427, UEM: 0.7242, LEM: 0.5180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2449, partial_loss/deprel_loss: 0.2433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4270, loss: 0.4618, batch_reg_loss: 0.1834, reg_loss: 0.1835 ||:  75%|#######4  | 71/95 [00:31<00:10,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9697, LAS: 0.9422, UEM: 0.7158, LEM: 0.5097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2932, partial_loss/deprel_loss: 0.3107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4905, loss: 0.4653, batch_reg_loss: 0.1833, reg_loss: 0.1835 ||:  80%|########  | 76/95 [00:33<00:08,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9523, UAS: 0.9698, LAS: 0.9424, UEM: 0.7206, LEM: 0.5148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1798, partial_loss/deprel_loss: 0.2240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3985, loss: 0.4648, batch_reg_loss: 0.1833, reg_loss: 0.1835 ||:  85%|########5 | 81/95 [00:36<00:06,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9545, UAS: 0.9701, LAS: 0.9426, UEM: 0.7232, LEM: 0.5165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1152, partial_loss/deprel_loss: 0.2238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3854, loss: 0.4649, batch_reg_loss: 0.1833, reg_loss: 0.1835 ||:  91%|######### | 86/95 [00:38<00:04,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9323, UAS: 0.9697, LAS: 0.9423, UEM: 0.7164, LEM: 0.5110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5114, partial_loss/deprel_loss: 0.3918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5990, loss: 0.4675, batch_reg_loss: 0.1833, reg_loss: 0.1834 ||:  96%|#########5| 91/95 [00:40<00:01,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9695, LAS: 0.9421, UEM: 0.7116, LEM: 0.5053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2759, partial_loss/deprel_loss: 0.2409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4312, loss: 0.4684, batch_reg_loss: 0.1833, reg_loss: 0.1834 ||: 100%|##########| 95/95 [00:42<00:00,  2.23it/s]\n",
+      "2023-04-07 02:18:53,988 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9645, LAS: 0.9191, UEM: 0.7971, LEM: 0.5561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 4.5998, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7228, loss: 5.0399, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  36%|###6      | 4/11 [00:02<00:04,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9536, LAS: 0.9045, UEM: 0.6965, LEM: 0.4431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1079, partial_loss/deprel_loss: 7.6961, partial_loss/cycle_loss: 0.0000, batch_loss: 6.3784, loss: 6.6649, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  73%|#######2  | 8/11 [00:05<00:01,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9526, LAS: 0.9014, UEM: 0.6878, LEM: 0.4156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5696, partial_loss/deprel_loss: 6.9750, partial_loss/cycle_loss: 0.0000, batch_loss: 5.6939, loss: 6.9893, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:06<00:00,  1.57it/s]\n",
+      "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.183  |     0.000\n",
+      "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - UEM                      |     0.712  |     0.688\n",
+      "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - LEM                      |     0.505  |     0.416\n",
+      "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - EM                       |     0.941  |     0.899\n",
+      "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.276  |     0.570\n",
+      "2023-04-07 02:19:00,987 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - UAS                      |     0.970  |     0.953\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.241  |     6.975\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - loss                     |     0.468  |     6.989\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - LAS                      |     0.942  |     0.901\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:19:00,988 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 02:19:00,994 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:19:05,879 - INFO - combo.training.trainer - Epoch duration: 0:00:57.816087\n",
+      "2023-04-07 02:19:05,879 - INFO - combo.training.trainer - Estimated training time remaining: 4:01:01\n",
+      "2023-04-07 02:19:05,879 - INFO - allennlp.training.trainer - Epoch 186/399\n",
+      "2023-04-07 02:19:05,880 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:19:05,880 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:19:05,888 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9510, UAS: 0.9657, LAS: 0.9372, UEM: 0.6630, LEM: 0.4470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1662, partial_loss/deprel_loss: 0.2648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4284, loss: 0.5067, batch_reg_loss: 0.1833, reg_loss: 0.1833 ||:   5%|5         | 5/95 [00:02<00:40,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9652, LAS: 0.9376, UEM: 0.6355, LEM: 0.4284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2578, partial_loss/deprel_loss: 0.2794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4583, loss: 0.5016, batch_reg_loss: 0.1832, reg_loss: 0.1833 ||:  11%|#         | 10/95 [00:04<00:38,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9661, LAS: 0.9395, UEM: 0.6360, LEM: 0.4271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4989, partial_loss/deprel_loss: 0.3126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5331, loss: 0.4916, batch_reg_loss: 0.1832, reg_loss: 0.1832 ||:  16%|#5        | 15/95 [00:06<00:36,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9617, UAS: 0.9693, LAS: 0.9426, UEM: 0.6979, LEM: 0.4948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1027, partial_loss/deprel_loss: 0.2005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3642, loss: 0.4722, batch_reg_loss: 0.1832, reg_loss: 0.1832 ||:  21%|##1       | 20/95 [00:09<00:34,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9701, LAS: 0.9433, UEM: 0.6981, LEM: 0.4870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2823, partial_loss/deprel_loss: 0.3129, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4900, loss: 0.4657, batch_reg_loss: 0.1832, reg_loss: 0.1832 ||:  26%|##6       | 25/95 [00:11<00:31,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9691, LAS: 0.9426, UEM: 0.6975, LEM: 0.4926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6066, partial_loss/deprel_loss: 0.3537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5875, loss: 0.4675, batch_reg_loss: 0.1832, reg_loss: 0.1832 ||:  32%|###1      | 30/95 [00:13<00:30,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9689, LAS: 0.9426, UEM: 0.6882, LEM: 0.4837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3191, partial_loss/deprel_loss: 0.3388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5180, loss: 0.4660, batch_reg_loss: 0.1832, reg_loss: 0.1832 ||:  37%|###6      | 35/95 [00:15<00:26,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9689, LAS: 0.9425, UEM: 0.6775, LEM: 0.4721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3450, partial_loss/deprel_loss: 0.3127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5023, loss: 0.4663, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||:  42%|####2     | 40/95 [00:18<00:24,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9542, UAS: 0.9680, LAS: 0.9416, UEM: 0.6728, LEM: 0.4692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1351, partial_loss/deprel_loss: 0.2079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3765, loss: 0.4703, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||:  47%|####7     | 45/95 [00:20<00:22,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9686, LAS: 0.9422, UEM: 0.6827, LEM: 0.4776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1947, partial_loss/deprel_loss: 0.2492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4214, loss: 0.4682, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||:  53%|#####2    | 50/95 [00:22<00:20,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9549, UAS: 0.9677, LAS: 0.9412, UEM: 0.6730, LEM: 0.4682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1068, partial_loss/deprel_loss: 0.2095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3721, loss: 0.4745, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||:  58%|#####7    | 55/95 [00:25<00:18,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9680, LAS: 0.9414, UEM: 0.6839, LEM: 0.4801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2162, partial_loss/deprel_loss: 0.2580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4327, loss: 0.4726, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||:  63%|######3   | 60/95 [00:27<00:15,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9677, LAS: 0.9412, UEM: 0.6740, LEM: 0.4704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2590, partial_loss/deprel_loss: 0.2636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4457, loss: 0.4741, batch_reg_loss: 0.1831, reg_loss: 0.1832 ||:  68%|######8   | 65/95 [00:29<00:13,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9296, UAS: 0.9678, LAS: 0.9413, UEM: 0.6783, LEM: 0.4759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4853, partial_loss/deprel_loss: 0.3729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5785, loss: 0.4748, batch_reg_loss: 0.1830, reg_loss: 0.1832 ||:  74%|#######3  | 70/95 [00:32<00:11,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9683, LAS: 0.9417, UEM: 0.6893, LEM: 0.4874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3323, partial_loss/deprel_loss: 0.3248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5093, loss: 0.4712, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||:  79%|#######8  | 75/95 [00:34<00:09,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9690, LAS: 0.9425, UEM: 0.6999, LEM: 0.4975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1083, partial_loss/deprel_loss: 0.2321, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3904, loss: 0.4659, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||:  84%|########4 | 80/95 [00:36<00:06,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9299, UAS: 0.9694, LAS: 0.9429, UEM: 0.7109, LEM: 0.5137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4694, partial_loss/deprel_loss: 0.2877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5070, loss: 0.4625, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||:  89%|########9 | 85/95 [00:39<00:04,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9688, LAS: 0.9424, UEM: 0.7054, LEM: 0.5069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4620, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5230, loss: 0.4659, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||:  95%|#########4| 90/95 [00:41<00:02,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9692, LAS: 0.9427, UEM: 0.7096, LEM: 0.5088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3484, partial_loss/deprel_loss: 0.3102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5008, loss: 0.4638, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||: 100%|##########| 95/95 [00:43<00:00,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9692, LAS: 0.9427, UEM: 0.7096, LEM: 0.5088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3484, partial_loss/deprel_loss: 0.3102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5008, loss: 0.4638, batch_reg_loss: 0.1830, reg_loss: 0.1831 ||: 100%|##########| 95/95 [00:43<00:00,  2.20it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.183  |       N/A\n",
+      "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - UEM                      |     0.710  |       N/A\n",
+      "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - LEM                      |     0.509  |       N/A\n",
+      "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - EM                       |     0.938  |       N/A\n",
+      "2023-04-07 02:19:51,737 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.348  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - UAS                      |     0.969  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.310  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - loss                     |     0.464  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - LAS                      |     0.943  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:19:51,738 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:19:51,743 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:19:55,738 - INFO - combo.training.trainer - Epoch duration: 0:00:49.858388\n",
+      "2023-04-07 02:19:55,738 - INFO - combo.training.trainer - Estimated training time remaining: 3:59:34\n",
+      "2023-04-07 02:19:55,738 - INFO - allennlp.training.trainer - Epoch 187/399\n",
+      "2023-04-07 02:19:55,738 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:19:55,739 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:19:55,746 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9738, LAS: 0.9445, UEM: 0.7373, LEM: 0.5254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1277, partial_loss/deprel_loss: 0.2377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3987, loss: 0.4425, batch_reg_loss: 0.1829, reg_loss: 0.1829 ||:   5%|5         | 5/95 [00:02<00:44,  2.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9494, UAS: 0.9701, LAS: 0.9425, UEM: 0.6734, LEM: 0.4657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1659, partial_loss/deprel_loss: 0.2346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4037, loss: 0.4636, batch_reg_loss: 0.1829, reg_loss: 0.1829 ||:  11%|#         | 10/95 [00:04<00:40,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9687, LAS: 0.9405, UEM: 0.6641, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4510, partial_loss/deprel_loss: 0.3956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5896, loss: 0.4761, batch_reg_loss: 0.1829, reg_loss: 0.1829 ||:  16%|#5        | 15/95 [00:06<00:36,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9681, LAS: 0.9403, UEM: 0.6361, LEM: 0.4227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2226, partial_loss/deprel_loss: 0.2724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4453, loss: 0.4780, batch_reg_loss: 0.1829, reg_loss: 0.1829 ||:  21%|##1       | 20/95 [00:08<00:33,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9676, LAS: 0.9398, UEM: 0.6648, LEM: 0.4587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1633, partial_loss/deprel_loss: 0.2320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4011, loss: 0.4773, batch_reg_loss: 0.1829, reg_loss: 0.1829 ||:  26%|##6       | 25/95 [00:11<00:32,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9700, LAS: 0.9428, UEM: 0.7328, LEM: 0.5448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1102, partial_loss/deprel_loss: 0.2185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3797, loss: 0.4601, batch_reg_loss: 0.1828, reg_loss: 0.1829 ||:  32%|###1      | 30/95 [00:13<00:30,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9504, UAS: 0.9706, LAS: 0.9435, UEM: 0.7399, LEM: 0.5511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1414, partial_loss/deprel_loss: 0.2290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3943, loss: 0.4567, batch_reg_loss: 0.1828, reg_loss: 0.1829 ||:  37%|###6      | 35/95 [00:15<00:27,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9550, UAS: 0.9713, LAS: 0.9441, UEM: 0.7467, LEM: 0.5537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1221, partial_loss/deprel_loss: 0.2234, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3859, loss: 0.4536, batch_reg_loss: 0.1828, reg_loss: 0.1829 ||:  42%|####2     | 40/95 [00:18<00:25,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9698, LAS: 0.9424, UEM: 0.7320, LEM: 0.5373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.3606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5473, loss: 0.4639, batch_reg_loss: 0.1828, reg_loss: 0.1829 ||:  47%|####7     | 45/95 [00:20<00:23,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9387, UAS: 0.9692, LAS: 0.9415, UEM: 0.7200, LEM: 0.5233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2031, partial_loss/deprel_loss: 0.2722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4411, loss: 0.4696, batch_reg_loss: 0.1828, reg_loss: 0.1829 ||:  53%|#####2    | 50/95 [00:22<00:20,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9697, LAS: 0.9423, UEM: 0.7238, LEM: 0.5278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2850, partial_loss/deprel_loss: 0.2954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4761, loss: 0.4640, batch_reg_loss: 0.1827, reg_loss: 0.1828 ||:  58%|#####7    | 55/95 [00:25<00:18,  2.16it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9534, UAS: 0.9697, LAS: 0.9424, UEM: 0.7291, LEM: 0.5372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1354, partial_loss/deprel_loss: 0.2235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3886, loss: 0.4627, batch_reg_loss: 0.1827, reg_loss: 0.1828 ||:  63%|######3   | 60/95 [00:27<00:16,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9696, LAS: 0.9423, UEM: 0.7209, LEM: 0.5266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1485, partial_loss/deprel_loss: 0.2856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4409, loss: 0.4656, batch_reg_loss: 0.1827, reg_loss: 0.1828 ||:  68%|######8   | 65/95 [00:29<00:13,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9699, LAS: 0.9426, UEM: 0.7262, LEM: 0.5327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0640, partial_loss/deprel_loss: 0.2180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3699, loss: 0.4637, batch_reg_loss: 0.1827, reg_loss: 0.1828 ||:  74%|#######3  | 70/95 [00:32<00:11,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9700, LAS: 0.9426, UEM: 0.7239, LEM: 0.5272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1377, partial_loss/deprel_loss: 0.2182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3848, loss: 0.4625, batch_reg_loss: 0.1827, reg_loss: 0.1828 ||:  79%|#######8  | 75/95 [00:34<00:08,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9704, LAS: 0.9430, UEM: 0.7238, LEM: 0.5237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3018, partial_loss/deprel_loss: 0.2760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4638, loss: 0.4602, batch_reg_loss: 0.1827, reg_loss: 0.1828 ||:  84%|########4 | 80/95 [00:36<00:06,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9702, LAS: 0.9427, UEM: 0.7180, LEM: 0.5160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2898, partial_loss/deprel_loss: 0.3097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4883, loss: 0.4630, batch_reg_loss: 0.1826, reg_loss: 0.1828 ||:  91%|######### | 86/95 [00:38<00:03,  2.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9696, LAS: 0.9422, UEM: 0.7158, LEM: 0.5159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4609, partial_loss/deprel_loss: 0.3057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5194, loss: 0.4663, batch_reg_loss: 0.1826, reg_loss: 0.1828 ||:  96%|#########5| 91/95 [00:40<00:01,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9692, LAS: 0.9417, UEM: 0.7090, LEM: 0.5090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5085, partial_loss/deprel_loss: 0.3670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5779, loss: 0.4697, batch_reg_loss: 0.1826, reg_loss: 0.1828 ||: 100%|##########| 95/95 [00:42<00:00,  2.24it/s]\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.183  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - UEM                      |     0.709  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - LEM                      |     0.509  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - EM                       |     0.932  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.508  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - UAS                      |     0.969  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.367  |       N/A\n",
+      "2023-04-07 02:20:40,922 - INFO - combo.training.tensorboard_writer - loss                     |     0.470  |       N/A\n",
+      "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - LAS                      |     0.942  |       N/A\n",
+      "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:20:40,923 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:20:40,927 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:20:44,479 - INFO - combo.training.trainer - Epoch duration: 0:00:48.740412\n",
+      "2023-04-07 02:20:44,479 - INFO - combo.training.trainer - Estimated training time remaining: 3:58:05\n",
+      "2023-04-07 02:20:44,479 - INFO - allennlp.training.trainer - Epoch 188/399\n",
+      "2023-04-07 02:20:44,480 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:20:44,481 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:20:44,491 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9801, LAS: 0.9529, UEM: 0.8096, LEM: 0.5966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2648, partial_loss/deprel_loss: 0.2622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4453, loss: 0.3854, batch_reg_loss: 0.1826, reg_loss: 0.1826 ||:   5%|5         | 5/95 [00:02<00:37,  2.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9742, LAS: 0.9481, UEM: 0.7212, LEM: 0.5115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2372, partial_loss/deprel_loss: 0.2542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4334, loss: 0.4284, batch_reg_loss: 0.1826, reg_loss: 0.1826 ||:  11%|#         | 10/95 [00:04<00:35,  2.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9751, LAS: 0.9487, UEM: 0.7435, LEM: 0.5323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1917, partial_loss/deprel_loss: 0.2284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4036, loss: 0.4221, batch_reg_loss: 0.1825, reg_loss: 0.1826 ||:  16%|#5        | 15/95 [00:06<00:34,  2.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9750, LAS: 0.9483, UEM: 0.7447, LEM: 0.5299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1541, partial_loss/deprel_loss: 0.1990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3726, loss: 0.4249, batch_reg_loss: 0.1825, reg_loss: 0.1826 ||:  21%|##1       | 20/95 [00:08<00:33,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9740, LAS: 0.9479, UEM: 0.7233, LEM: 0.5085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3368, partial_loss/deprel_loss: 0.2994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4894, loss: 0.4316, batch_reg_loss: 0.1825, reg_loss: 0.1826 ||:  26%|##6       | 25/95 [00:10<00:30,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9734, LAS: 0.9470, UEM: 0.7199, LEM: 0.5031, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1018, partial_loss/deprel_loss: 0.2249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3828, loss: 0.4370, batch_reg_loss: 0.1825, reg_loss: 0.1825 ||:  32%|###1      | 30/95 [00:13<00:28,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9728, LAS: 0.9462, UEM: 0.7209, LEM: 0.5014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2378, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4609, loss: 0.4429, batch_reg_loss: 0.1825, reg_loss: 0.1825 ||:  37%|###6      | 35/95 [00:15<00:26,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9717, LAS: 0.9452, UEM: 0.7065, LEM: 0.4878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3008, partial_loss/deprel_loss: 0.2881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4731, loss: 0.4492, batch_reg_loss: 0.1825, reg_loss: 0.1825 ||:  42%|####2     | 40/95 [00:17<00:23,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9347, UAS: 0.9723, LAS: 0.9455, UEM: 0.7222, LEM: 0.5056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3109, partial_loss/deprel_loss: 0.3028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4868, loss: 0.4452, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||:  47%|####7     | 45/95 [00:19<00:22,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9549, UAS: 0.9719, LAS: 0.9452, UEM: 0.7191, LEM: 0.5032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0901, partial_loss/deprel_loss: 0.2167, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3738, loss: 0.4478, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||:  53%|#####2    | 50/95 [00:22<00:19,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9707, LAS: 0.9439, UEM: 0.7071, LEM: 0.4909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2655, partial_loss/deprel_loss: 0.3009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4762, loss: 0.4575, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||:  58%|#####7    | 55/95 [00:24<00:17,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9697, LAS: 0.9428, UEM: 0.6977, LEM: 0.4819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2602, partial_loss/deprel_loss: 0.2986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4733, loss: 0.4643, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||:  63%|######3   | 60/95 [00:26<00:15,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9696, LAS: 0.9427, UEM: 0.6931, LEM: 0.4770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4630, partial_loss/deprel_loss: 0.3783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5776, loss: 0.4668, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||:  68%|######8   | 65/95 [00:28<00:13,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9698, LAS: 0.9427, UEM: 0.6992, LEM: 0.4843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5744, partial_loss/deprel_loss: 0.3772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5990, loss: 0.4668, batch_reg_loss: 0.1824, reg_loss: 0.1825 ||:  74%|#######3  | 70/95 [00:31<00:11,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9530, UAS: 0.9698, LAS: 0.9429, UEM: 0.7004, LEM: 0.4858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1531, partial_loss/deprel_loss: 0.2386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4039, loss: 0.4653, batch_reg_loss: 0.1823, reg_loss: 0.1825 ||:  79%|#######8  | 75/95 [00:33<00:09,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9692, LAS: 0.9423, UEM: 0.6951, LEM: 0.4819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5602, partial_loss/deprel_loss: 0.3634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5851, loss: 0.4688, batch_reg_loss: 0.1823, reg_loss: 0.1825 ||:  84%|########4 | 80/95 [00:36<00:07,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9744, UAS: 0.9699, LAS: 0.9431, UEM: 0.7190, LEM: 0.5157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0234, partial_loss/deprel_loss: 0.1003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2672, loss: 0.4637, batch_reg_loss: 0.1823, reg_loss: 0.1824 ||:  89%|########9 | 85/95 [00:38<00:04,  2.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9620, UAS: 0.9700, LAS: 0.9432, UEM: 0.7213, LEM: 0.5185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0915, partial_loss/deprel_loss: 0.1827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3468, loss: 0.4623, batch_reg_loss: 0.1823, reg_loss: 0.1824 ||:  95%|#########4| 90/95 [00:40<00:02,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9697, LAS: 0.9429, UEM: 0.7152, LEM: 0.5121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4256, partial_loss/deprel_loss: 0.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5428, loss: 0.4639, batch_reg_loss: 0.1823, reg_loss: 0.1824 ||: 100%|##########| 95/95 [00:42<00:00,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9697, LAS: 0.9429, UEM: 0.7152, LEM: 0.5121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4256, partial_loss/deprel_loss: 0.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5428, loss: 0.4639, batch_reg_loss: 0.1823, reg_loss: 0.1824 ||: 100%|##########| 95/95 [00:42<00:00,  2.21it/s]\n",
+      "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.182  |       N/A\n",
+      "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - UEM                      |     0.715  |       N/A\n",
+      "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - LEM                      |     0.512  |       N/A\n",
+      "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - EM                       |     0.934  |       N/A\n",
+      "2023-04-07 02:21:30,456 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.426  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - UAS                      |     0.970  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.344  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - loss                     |     0.464  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - LAS                      |     0.943  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:21:30,457 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:21:30,463 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:21:34,372 - INFO - combo.training.trainer - Epoch duration: 0:00:49.892762\n",
+      "2023-04-07 02:21:34,372 - INFO - combo.training.trainer - Estimated training time remaining: 3:56:38\n",
+      "2023-04-07 02:21:34,373 - INFO - allennlp.training.trainer - Epoch 189/399\n",
+      "2023-04-07 02:21:34,373 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:21:34,373 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:21:34,382 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9734, LAS: 0.9445, UEM: 0.7078, LEM: 0.4754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1072, partial_loss/deprel_loss: 0.1919, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3572, loss: 0.4531, batch_reg_loss: 0.1823, reg_loss: 0.1823 ||:   5%|5         | 5/95 [00:02<00:37,  2.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9699, LAS: 0.9423, UEM: 0.6860, LEM: 0.4664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4790, partial_loss/deprel_loss: 0.3559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5628, loss: 0.4679, batch_reg_loss: 0.1822, reg_loss: 0.1823 ||:  12%|#1        | 11/95 [00:04<00:34,  2.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9651, LAS: 0.9384, UEM: 0.6247, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8505, partial_loss/deprel_loss: 0.4051, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6764, loss: 0.4925, batch_reg_loss: 0.1822, reg_loss: 0.1823 ||:  17%|#6        | 16/95 [00:06<00:32,  2.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9659, LAS: 0.9389, UEM: 0.6478, LEM: 0.4336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1255, partial_loss/deprel_loss: 0.2007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3679, loss: 0.4855, batch_reg_loss: 0.1822, reg_loss: 0.1822 ||:  22%|##2       | 21/95 [00:09<00:32,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9671, LAS: 0.9400, UEM: 0.6776, LEM: 0.4734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1830, partial_loss/deprel_loss: 0.2994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4583, loss: 0.4797, batch_reg_loss: 0.1822, reg_loss: 0.1822 ||:  27%|##7       | 26/95 [00:11<00:30,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9684, LAS: 0.9412, UEM: 0.7049, LEM: 0.4990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1352, partial_loss/deprel_loss: 0.2439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4043, loss: 0.4711, batch_reg_loss: 0.1822, reg_loss: 0.1822 ||:  33%|###2      | 31/95 [00:13<00:29,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9439, UAS: 0.9696, LAS: 0.9427, UEM: 0.7321, LEM: 0.5369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2710, partial_loss/deprel_loss: 0.2446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4321, loss: 0.4622, batch_reg_loss: 0.1822, reg_loss: 0.1822 ||:  38%|###7      | 36/95 [00:16<00:27,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9507, UAS: 0.9686, LAS: 0.9421, UEM: 0.7178, LEM: 0.5225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2108, partial_loss/deprel_loss: 0.2257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4049, loss: 0.4658, batch_reg_loss: 0.1822, reg_loss: 0.1822 ||:  43%|####3     | 41/95 [00:18<00:24,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9681, LAS: 0.9415, UEM: 0.7043, LEM: 0.5062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3203, partial_loss/deprel_loss: 0.2869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4757, loss: 0.4691, batch_reg_loss: 0.1821, reg_loss: 0.1822 ||:  48%|####8     | 46/95 [00:20<00:22,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9561, UAS: 0.9690, LAS: 0.9422, UEM: 0.7141, LEM: 0.5133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1231, partial_loss/deprel_loss: 0.1746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3464, loss: 0.4630, batch_reg_loss: 0.1821, reg_loss: 0.1822 ||:  55%|#####4    | 52/95 [00:23<00:18,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9700, LAS: 0.9431, UEM: 0.7255, LEM: 0.5227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2795, partial_loss/deprel_loss: 0.3428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5122, loss: 0.4575, batch_reg_loss: 0.1821, reg_loss: 0.1822 ||:  61%|######1   | 58/95 [00:25<00:15,  2.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9597, UAS: 0.9706, LAS: 0.9436, UEM: 0.7270, LEM: 0.5214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1552, partial_loss/deprel_loss: 0.2337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4001, loss: 0.4545, batch_reg_loss: 0.1821, reg_loss: 0.1822 ||:  66%|######6   | 63/95 [00:27<00:13,  2.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9585, UAS: 0.9705, LAS: 0.9436, UEM: 0.7209, LEM: 0.5134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1139, partial_loss/deprel_loss: 0.2043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3683, loss: 0.4561, batch_reg_loss: 0.1821, reg_loss: 0.1822 ||:  72%|#######1  | 68/95 [00:29<00:11,  2.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9705, LAS: 0.9435, UEM: 0.7166, LEM: 0.5079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2353, partial_loss/deprel_loss: 0.2779, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4514, loss: 0.4572, batch_reg_loss: 0.1820, reg_loss: 0.1822 ||:  77%|#######6  | 73/95 [00:31<00:09,  2.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9701, LAS: 0.9430, UEM: 0.7112, LEM: 0.5012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1620, partial_loss/deprel_loss: 0.2726, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4325, loss: 0.4609, batch_reg_loss: 0.1820, reg_loss: 0.1822 ||:  82%|########2 | 78/95 [00:33<00:07,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9704, LAS: 0.9434, UEM: 0.7200, LEM: 0.5111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.2539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4983, loss: 0.4580, batch_reg_loss: 0.1820, reg_loss: 0.1822 ||:  87%|########7 | 83/95 [00:36<00:05,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9706, LAS: 0.9435, UEM: 0.7200, LEM: 0.5105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2367, partial_loss/deprel_loss: 0.2492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4287, loss: 0.4566, batch_reg_loss: 0.1820, reg_loss: 0.1821 ||:  93%|#########2| 88/95 [00:38<00:03,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9702, LAS: 0.9431, UEM: 0.7186, LEM: 0.5104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8426, partial_loss/deprel_loss: 0.4660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7233, loss: 0.4596, batch_reg_loss: 0.1820, reg_loss: 0.1821 ||:  98%|#########7| 93/95 [00:41<00:00,  2.16it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9704, LAS: 0.9433, UEM: 0.7191, LEM: 0.5098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1980, partial_loss/deprel_loss: 0.2064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3867, loss: 0.4587, batch_reg_loss: 0.1820, reg_loss: 0.1821 ||: 100%|##########| 95/95 [00:41<00:00,  2.27it/s]\n",
+      "2023-04-07 02:22:19,518 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:22:19,518 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 02:22:19,518 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.182  |       N/A\n",
+      "2023-04-07 02:22:19,518 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - UEM                      |     0.719  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - LEM                      |     0.510  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - EM                       |     0.951  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.198  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - UAS                      |     0.970  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.206  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - loss                     |     0.459  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - LAS                      |     0.943  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:22:19,519 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:22:19,520 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:22:19,520 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:22:19,520 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:22:19,526 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:22:23,753 - INFO - combo.training.trainer - Epoch duration: 0:00:49.380132\n",
+      "2023-04-07 02:22:23,753 - INFO - combo.training.trainer - Estimated training time remaining: 3:55:11\n",
+      "2023-04-07 02:22:23,754 - INFO - allennlp.training.trainer - Epoch 190/399\n",
+      "2023-04-07 02:22:23,754 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:22:23,755 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:22:23,765 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9683, LAS: 0.9431, UEM: 0.6156, LEM: 0.3905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1820, partial_loss/deprel_loss: 0.2421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4121, loss: 0.4673, batch_reg_loss: 0.1820, reg_loss: 0.1820 ||:   5%|5         | 5/95 [00:02<00:39,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9589, UAS: 0.9722, LAS: 0.9465, UEM: 0.7104, LEM: 0.4901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1259, partial_loss/deprel_loss: 0.2186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3820, loss: 0.4511, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||:  11%|#         | 10/95 [00:04<00:38,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9308, UAS: 0.9674, LAS: 0.9419, UEM: 0.6680, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4621, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5856, loss: 0.4839, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||:  15%|#4        | 14/95 [00:06<00:37,  2.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9697, LAS: 0.9430, UEM: 0.7076, LEM: 0.4921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2136, partial_loss/deprel_loss: 0.2377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4147, loss: 0.4676, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||:  20%|##        | 19/95 [00:08<00:34,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9292, UAS: 0.9694, LAS: 0.9427, UEM: 0.6963, LEM: 0.4818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4350, partial_loss/deprel_loss: 0.3412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5418, loss: 0.4686, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||:  25%|##5       | 24/95 [00:10<00:31,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9601, UAS: 0.9705, LAS: 0.9440, UEM: 0.7347, LEM: 0.5340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0790, partial_loss/deprel_loss: 0.1966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3549, loss: 0.4606, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||:  29%|##9       | 28/95 [00:12<00:31,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9705, LAS: 0.9440, UEM: 0.7253, LEM: 0.5191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2995, partial_loss/deprel_loss: 0.2734, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4605, loss: 0.4621, batch_reg_loss: 0.1819, reg_loss: 0.1819 ||:  35%|###4      | 33/95 [00:15<00:28,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9697, LAS: 0.9433, UEM: 0.7059, LEM: 0.4992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2593, partial_loss/deprel_loss: 0.2728, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4520, loss: 0.4638, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||:  40%|####      | 38/95 [00:17<00:26,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9704, LAS: 0.9442, UEM: 0.7282, LEM: 0.5355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3659, partial_loss/deprel_loss: 0.2750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4750, loss: 0.4565, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||:  45%|####5     | 43/95 [00:19<00:24,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9498, UAS: 0.9698, LAS: 0.9438, UEM: 0.7174, LEM: 0.5219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1917, partial_loss/deprel_loss: 0.2269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4017, loss: 0.4600, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||:  51%|#####     | 48/95 [00:21<00:21,  2.18it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9701, LAS: 0.9439, UEM: 0.7219, LEM: 0.5263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3302, partial_loss/deprel_loss: 0.2916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4811, loss: 0.4571, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||:  56%|#####5    | 53/95 [00:24<00:19,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9704, LAS: 0.9441, UEM: 0.7257, LEM: 0.5294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1361, partial_loss/deprel_loss: 0.2343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3964, loss: 0.4548, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||:  61%|######1   | 58/95 [00:26<00:16,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9494, UAS: 0.9708, LAS: 0.9445, UEM: 0.7259, LEM: 0.5276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1945, partial_loss/deprel_loss: 0.2593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4281, loss: 0.4531, batch_reg_loss: 0.1818, reg_loss: 0.1819 ||:  66%|######6   | 63/95 [00:28<00:14,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9531, UAS: 0.9708, LAS: 0.9444, UEM: 0.7213, LEM: 0.5212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1591, partial_loss/deprel_loss: 0.2158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3862, loss: 0.4532, batch_reg_loss: 0.1817, reg_loss: 0.1819 ||:  72%|#######1  | 68/95 [00:30<00:12,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9708, LAS: 0.9443, UEM: 0.7210, LEM: 0.5207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1151, partial_loss/deprel_loss: 0.2258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3854, loss: 0.4537, batch_reg_loss: 0.1817, reg_loss: 0.1818 ||:  77%|#######6  | 73/95 [00:33<00:09,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9486, UAS: 0.9708, LAS: 0.9442, UEM: 0.7237, LEM: 0.5240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2139, partial_loss/deprel_loss: 0.2541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4278, loss: 0.4542, batch_reg_loss: 0.1817, reg_loss: 0.1818 ||:  82%|########2 | 78/95 [00:35<00:07,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9702, LAS: 0.9438, UEM: 0.7130, LEM: 0.5141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3370, partial_loss/deprel_loss: 0.2908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4817, loss: 0.4579, batch_reg_loss: 0.1817, reg_loss: 0.1818 ||:  87%|########7 | 83/95 [00:37<00:05,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9699, LAS: 0.9435, UEM: 0.7117, LEM: 0.5103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7758, partial_loss/deprel_loss: 0.4238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.4598, batch_reg_loss: 0.1817, reg_loss: 0.1818 ||:  93%|#########2| 88/95 [00:39<00:03,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9696, LAS: 0.9432, UEM: 0.7087, LEM: 0.5072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4431, partial_loss/deprel_loss: 0.3670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5639, loss: 0.4626, batch_reg_loss: 0.1816, reg_loss: 0.1818 ||:  99%|#########8| 94/95 [00:42<00:00,  2.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9697, LAS: 0.9432, UEM: 0.7116, LEM: 0.5106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1498, partial_loss/deprel_loss: 0.2243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3911, loss: 0.4619, batch_reg_loss: 0.1816, reg_loss: 0.1818 ||: 100%|##########| 95/95 [00:42<00:00,  2.21it/s]\n",
+      "2023-04-07 02:23:09,717 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8558, UAS: 0.9366, LAS: 0.8829, UEM: 0.5207, LEM: 0.2590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6660, partial_loss/deprel_loss: 15.5290, partial_loss/cycle_loss: 0.0000, batch_loss: 12.7564, loss: 9.2649, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  27%|##7       | 3/11 [00:02<00:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9520, LAS: 0.9041, UEM: 0.7383, LEM: 0.4969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0763, partial_loss/deprel_loss: 7.6127, partial_loss/cycle_loss: 0.0000, batch_loss: 6.3054, loss: 6.6328, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:04<00:02,  1.48it/s]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9520, LAS: 0.9007, UEM: 0.6888, LEM: 0.4156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9626, partial_loss/deprel_loss: 8.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 6.9736, loss: 6.7944, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:06<00:00,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9520, LAS: 0.9007, UEM: 0.6888, LEM: 0.4156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9626, partial_loss/deprel_loss: 8.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 6.9736, loss: 6.7944, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:06<00:00,  1.59it/s]\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.182  |     0.000\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - UEM                      |     0.712  |     0.689\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - LEM                      |     0.511  |     0.416\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - EM                       |     0.950  |     0.894\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.150  |     0.963\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 02:23:16,654 - INFO - combo.training.tensorboard_writer - UAS                      |     0.970  |     0.952\n",
+      "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.224  |     8.476\n",
+      "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - loss                     |     0.462  |     6.794\n",
+      "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - LAS                      |     0.943  |     0.901\n",
+      "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:23:16,655 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 02:23:16,659 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:23:21,377 - INFO - combo.training.trainer - Epoch duration: 0:00:57.623587\n",
+      "2023-04-07 02:23:21,378 - INFO - combo.training.trainer - Estimated training time remaining: 3:53:53\n",
+      "2023-04-07 02:23:21,378 - INFO - allennlp.training.trainer - Epoch 191/399\n",
+      "2023-04-07 02:23:21,378 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:23:21,379 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:23:21,387 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9762, LAS: 0.9530, UEM: 0.8104, LEM: 0.6826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4080, partial_loss/deprel_loss: 0.2985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5020, loss: 0.4168, batch_reg_loss: 0.1816, reg_loss: 0.1816 ||:   5%|5         | 5/95 [00:02<00:43,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9546, UAS: 0.9707, LAS: 0.9478, UEM: 0.7378, LEM: 0.5919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1372, partial_loss/deprel_loss: 0.2182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3836, loss: 0.4425, batch_reg_loss: 0.1816, reg_loss: 0.1816 ||:  11%|#         | 10/95 [00:04<00:40,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9518, UAS: 0.9730, LAS: 0.9487, UEM: 0.7628, LEM: 0.5917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1339, partial_loss/deprel_loss: 0.2414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4015, loss: 0.4341, batch_reg_loss: 0.1816, reg_loss: 0.1816 ||:  16%|#5        | 15/95 [00:06<00:36,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9489, UAS: 0.9723, LAS: 0.9473, UEM: 0.7500, LEM: 0.5666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.2770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4429, loss: 0.4364, batch_reg_loss: 0.1816, reg_loss: 0.1816 ||:  21%|##1       | 20/95 [00:09<00:35,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9455, UAS: 0.9718, LAS: 0.9467, UEM: 0.7363, LEM: 0.5494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2069, partial_loss/deprel_loss: 0.3008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4636, loss: 0.4407, batch_reg_loss: 0.1815, reg_loss: 0.1816 ||:  26%|##6       | 25/95 [00:11<00:32,  2.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9443, UAS: 0.9727, LAS: 0.9474, UEM: 0.7427, LEM: 0.5499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2506, partial_loss/deprel_loss: 0.2547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4354, loss: 0.4369, batch_reg_loss: 0.1815, reg_loss: 0.1816 ||:  32%|###1      | 30/95 [00:13<00:28,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9709, LAS: 0.9456, UEM: 0.7265, LEM: 0.5331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5312, partial_loss/deprel_loss: 0.4106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6162, loss: 0.4465, batch_reg_loss: 0.1815, reg_loss: 0.1816 ||:  37%|###6      | 35/95 [00:15<00:26,  2.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9701, LAS: 0.9450, UEM: 0.7112, LEM: 0.5160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3045, partial_loss/deprel_loss: 0.2685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4572, loss: 0.4508, batch_reg_loss: 0.1815, reg_loss: 0.1816 ||:  43%|####3     | 41/95 [00:18<00:22,  2.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9503, UAS: 0.9708, LAS: 0.9456, UEM: 0.7304, LEM: 0.5394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2075, partial_loss/deprel_loss: 0.2609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4317, loss: 0.4471, batch_reg_loss: 0.1815, reg_loss: 0.1816 ||:  48%|####8     | 46/95 [00:20<00:21,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9629, UAS: 0.9708, LAS: 0.9457, UEM: 0.7308, LEM: 0.5406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0844, partial_loss/deprel_loss: 0.1644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3299, loss: 0.4468, batch_reg_loss: 0.1815, reg_loss: 0.1815 ||:  54%|#####3    | 51/95 [00:22<00:19,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9709, LAS: 0.9458, UEM: 0.7358, LEM: 0.5494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5184, partial_loss/deprel_loss: 0.3087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5321, loss: 0.4456, batch_reg_loss: 0.1814, reg_loss: 0.1815 ||:  59%|#####8    | 56/95 [00:24<00:17,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9710, LAS: 0.9459, UEM: 0.7306, LEM: 0.5424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2881, partial_loss/deprel_loss: 0.3186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4939, loss: 0.4462, batch_reg_loss: 0.1814, reg_loss: 0.1815 ||:  64%|######4   | 61/95 [00:27<00:15,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9552, UAS: 0.9711, LAS: 0.9460, UEM: 0.7318, LEM: 0.5432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1279, partial_loss/deprel_loss: 0.2277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3891, loss: 0.4458, batch_reg_loss: 0.1814, reg_loss: 0.1815 ||:  69%|######9   | 66/95 [00:29<00:12,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9712, LAS: 0.9460, UEM: 0.7271, LEM: 0.5366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3800, partial_loss/deprel_loss: 0.3084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5041, loss: 0.4449, batch_reg_loss: 0.1814, reg_loss: 0.1815 ||:  75%|#######4  | 71/95 [00:31<00:10,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9539, UAS: 0.9709, LAS: 0.9455, UEM: 0.7214, LEM: 0.5291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.2812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4490, loss: 0.4481, batch_reg_loss: 0.1814, reg_loss: 0.1815 ||:  80%|########  | 76/95 [00:33<00:08,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9463, UAS: 0.9710, LAS: 0.9455, UEM: 0.7300, LEM: 0.5386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2097, partial_loss/deprel_loss: 0.2878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4535, loss: 0.4480, batch_reg_loss: 0.1813, reg_loss: 0.1815 ||:  85%|########5 | 81/95 [00:36<00:06,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9708, LAS: 0.9452, UEM: 0.7248, LEM: 0.5333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6504, partial_loss/deprel_loss: 0.4025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6334, loss: 0.4495, batch_reg_loss: 0.1813, reg_loss: 0.1815 ||:  91%|######### | 86/95 [00:38<00:04,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9703, LAS: 0.9448, UEM: 0.7224, LEM: 0.5305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8756, partial_loss/deprel_loss: 0.3987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6754, loss: 0.4529, batch_reg_loss: 0.1813, reg_loss: 0.1815 ||:  96%|#########5| 91/95 [00:41<00:01,  2.14it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9700, LAS: 0.9445, UEM: 0.7157, LEM: 0.5243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4311, partial_loss/deprel_loss: 0.3561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5524, loss: 0.4553, batch_reg_loss: 0.1813, reg_loss: 0.1815 ||: 100%|##########| 95/95 [00:42<00:00,  2.22it/s]\n",
+      "2023-04-07 02:24:07,237 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.181  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - UEM                      |     0.716  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - LEM                      |     0.524  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - EM                       |     0.930  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.431  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - UAS                      |     0.970  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:24:07,238 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.356  |       N/A\n",
+      "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - loss                     |     0.455  |       N/A\n",
+      "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - LAS                      |     0.944  |       N/A\n",
+      "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:24:07,239 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:24:07,245 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:24:10,763 - INFO - combo.training.trainer - Epoch duration: 0:00:49.385025\n",
+      "2023-04-07 02:24:10,763 - INFO - combo.training.trainer - Estimated training time remaining: 3:52:27\n",
+      "2023-04-07 02:24:10,763 - INFO - allennlp.training.trainer - Epoch 192/399\n",
+      "2023-04-07 02:24:10,764 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:24:10,764 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:24:10,773 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9613, UAS: 0.9789, LAS: 0.9571, UEM: 0.8140, LEM: 0.6628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1674, partial_loss/deprel_loss: 0.1925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3687, loss: 0.3693, batch_reg_loss: 0.1813, reg_loss: 0.1813 ||:   5%|5         | 5/95 [00:02<00:40,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9768, LAS: 0.9515, UEM: 0.7751, LEM: 0.5848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1505, partial_loss/deprel_loss: 0.2764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4325, loss: 0.3985, batch_reg_loss: 0.1813, reg_loss: 0.1813 ||:  11%|#         | 10/95 [00:04<00:37,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9755, LAS: 0.9494, UEM: 0.7461, LEM: 0.5409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3569, partial_loss/deprel_loss: 0.2681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4671, loss: 0.4175, batch_reg_loss: 0.1812, reg_loss: 0.1813 ||:  16%|#5        | 15/95 [00:06<00:35,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9706, LAS: 0.9449, UEM: 0.6997, LEM: 0.5008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5681, partial_loss/deprel_loss: 0.3962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.4494, batch_reg_loss: 0.1812, reg_loss: 0.1813 ||:  21%|##1       | 20/95 [00:08<00:32,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9695, LAS: 0.9437, UEM: 0.6775, LEM: 0.4728, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1283, partial_loss/deprel_loss: 0.2054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3712, loss: 0.4588, batch_reg_loss: 0.1812, reg_loss: 0.1813 ||:  26%|##6       | 25/95 [00:10<00:30,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9399, UAS: 0.9710, LAS: 0.9448, UEM: 0.7127, LEM: 0.5073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3621, partial_loss/deprel_loss: 0.3050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4976, loss: 0.4494, batch_reg_loss: 0.1812, reg_loss: 0.1812 ||:  32%|###1      | 30/95 [00:13<00:28,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9696, LAS: 0.9436, UEM: 0.6882, LEM: 0.4838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2967, partial_loss/deprel_loss: 0.3378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5108, loss: 0.4580, batch_reg_loss: 0.1812, reg_loss: 0.1812 ||:  37%|###6      | 35/95 [00:15<00:27,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9696, LAS: 0.9434, UEM: 0.6808, LEM: 0.4750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3107, partial_loss/deprel_loss: 0.2804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4677, loss: 0.4592, batch_reg_loss: 0.1812, reg_loss: 0.1812 ||:  42%|####2     | 40/95 [00:17<00:24,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9701, LAS: 0.9441, UEM: 0.6826, LEM: 0.4732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2059, partial_loss/deprel_loss: 0.2073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3882, loss: 0.4544, batch_reg_loss: 0.1812, reg_loss: 0.1812 ||:  47%|####7     | 45/95 [00:19<00:22,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9690, LAS: 0.9429, UEM: 0.6746, LEM: 0.4675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7076, partial_loss/deprel_loss: 0.3990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6418, loss: 0.4621, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||:  53%|#####2    | 50/95 [00:22<00:20,  2.17it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9628, UAS: 0.9695, LAS: 0.9435, UEM: 0.6949, LEM: 0.4947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0965, partial_loss/deprel_loss: 0.1971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3581, loss: 0.4580, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||:  58%|#####7    | 55/95 [00:24<00:18,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9772, UAS: 0.9699, LAS: 0.9442, UEM: 0.7150, LEM: 0.5234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0246, partial_loss/deprel_loss: 0.0824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2520, loss: 0.4537, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||:  63%|######3   | 60/95 [00:27<00:16,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9705, LAS: 0.9448, UEM: 0.7184, LEM: 0.5227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2057, partial_loss/deprel_loss: 0.2958, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4589, loss: 0.4506, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||:  68%|######8   | 65/95 [00:29<00:13,  2.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9705, LAS: 0.9448, UEM: 0.7193, LEM: 0.5254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5896, partial_loss/deprel_loss: 0.3207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5555, loss: 0.4494, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||:  74%|#######3  | 70/95 [00:31<00:11,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9704, LAS: 0.9447, UEM: 0.7176, LEM: 0.5238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1456, partial_loss/deprel_loss: 0.2796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4338, loss: 0.4503, batch_reg_loss: 0.1811, reg_loss: 0.1812 ||:  79%|#######8  | 75/95 [00:33<00:09,  2.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9702, LAS: 0.9445, UEM: 0.7141, LEM: 0.5192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1663, partial_loss/deprel_loss: 0.2351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4024, loss: 0.4520, batch_reg_loss: 0.1810, reg_loss: 0.1812 ||:  84%|########4 | 80/95 [00:36<00:06,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9522, UAS: 0.9703, LAS: 0.9446, UEM: 0.7100, LEM: 0.5132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1606, partial_loss/deprel_loss: 0.2619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4226, loss: 0.4517, batch_reg_loss: 0.1810, reg_loss: 0.1812 ||:  89%|########9 | 85/95 [00:38<00:04,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9703, LAS: 0.9445, UEM: 0.7135, LEM: 0.5165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1958, partial_loss/deprel_loss: 0.2959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4569, loss: 0.4512, batch_reg_loss: 0.1810, reg_loss: 0.1812 ||:  95%|#########4| 90/95 [00:40<00:02,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9705, LAS: 0.9447, UEM: 0.7152, LEM: 0.5187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3115, partial_loss/deprel_loss: 0.2870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4729, loss: 0.4505, batch_reg_loss: 0.1810, reg_loss: 0.1811 ||: 100%|##########| 95/95 [00:42<00:00,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9705, LAS: 0.9447, UEM: 0.7152, LEM: 0.5187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3115, partial_loss/deprel_loss: 0.2870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4729, loss: 0.4505, batch_reg_loss: 0.1810, reg_loss: 0.1811 ||: 100%|##########| 95/95 [00:42<00:00,  2.24it/s]\n",
+      "2023-04-07 02:24:55,870 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:24:55,870 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.181  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - UEM                      |     0.715  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - LEM                      |     0.519  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - EM                       |     0.945  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.311  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - UAS                      |     0.971  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.287  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - loss                     |     0.450  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - LAS                      |     0.945  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:24:55,871 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:24:55,872 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:24:55,872 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:24:55,872 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:24:55,876 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:24:59,808 - INFO - combo.training.trainer - Epoch duration: 0:00:49.044927\n",
+      "2023-04-07 02:24:59,809 - INFO - combo.training.trainer - Estimated training time remaining: 3:51:01\n",
+      "2023-04-07 02:24:59,809 - INFO - allennlp.training.trainer - Epoch 193/399\n",
+      "2023-04-07 02:24:59,809 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:24:59,809 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:24:59,816 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9712, LAS: 0.9460, UEM: 0.6768, LEM: 0.4649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1532, partial_loss/deprel_loss: 0.1918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3650, loss: 0.4546, batch_reg_loss: 0.1810, reg_loss: 0.1810 ||:   5%|5         | 5/95 [00:02<00:37,  2.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9629, UAS: 0.9743, LAS: 0.9499, UEM: 0.7249, LEM: 0.5187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1009, partial_loss/deprel_loss: 0.1800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3451, loss: 0.4308, batch_reg_loss: 0.1809, reg_loss: 0.1810 ||:  12%|#1        | 11/95 [00:04<00:34,  2.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9506, UAS: 0.9751, LAS: 0.9503, UEM: 0.7506, LEM: 0.5484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2127, partial_loss/deprel_loss: 0.2848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4513, loss: 0.4221, batch_reg_loss: 0.1809, reg_loss: 0.1810 ||:  17%|#6        | 16/95 [00:06<00:33,  2.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9543, UAS: 0.9744, LAS: 0.9492, UEM: 0.7438, LEM: 0.5364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.2250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4066, loss: 0.4259, batch_reg_loss: 0.1809, reg_loss: 0.1809 ||:  22%|##2       | 21/95 [00:08<00:31,  2.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9750, LAS: 0.9494, UEM: 0.7493, LEM: 0.5388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2943, partial_loss/deprel_loss: 0.3258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5004, loss: 0.4243, batch_reg_loss: 0.1809, reg_loss: 0.1809 ||:  27%|##7       | 26/95 [00:11<00:29,  2.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9720, LAS: 0.9467, UEM: 0.7135, LEM: 0.5080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4501, partial_loss/deprel_loss: 0.3221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5285, loss: 0.4414, batch_reg_loss: 0.1809, reg_loss: 0.1809 ||:  33%|###2      | 31/95 [00:13<00:27,  2.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9707, LAS: 0.9454, UEM: 0.6946, LEM: 0.4908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2969, partial_loss/deprel_loss: 0.3191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4955, loss: 0.4463, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||:  38%|###7      | 36/95 [00:15<00:25,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9716, LAS: 0.9462, UEM: 0.7253, LEM: 0.5326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2574, partial_loss/deprel_loss: 0.2802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4565, loss: 0.4415, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||:  43%|####3     | 41/95 [00:18<00:24,  2.19it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9716, LAS: 0.9461, UEM: 0.7216, LEM: 0.5266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2191, partial_loss/deprel_loss: 0.2556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4291, loss: 0.4434, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||:  48%|####8     | 46/95 [00:20<00:21,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9528, UAS: 0.9709, LAS: 0.9453, UEM: 0.7201, LEM: 0.5261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1397, partial_loss/deprel_loss: 0.2232, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3873, loss: 0.4483, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||:  54%|#####3    | 51/95 [00:22<00:20,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9491, UAS: 0.9708, LAS: 0.9452, UEM: 0.7142, LEM: 0.5176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2631, partial_loss/deprel_loss: 0.2539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4366, loss: 0.4499, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||:  59%|#####8    | 56/95 [00:25<00:18,  2.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9702, LAS: 0.9444, UEM: 0.7056, LEM: 0.5090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2823, partial_loss/deprel_loss: 0.2712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4542, loss: 0.4541, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||:  64%|######4   | 61/95 [00:27<00:15,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9463, UAS: 0.9708, LAS: 0.9450, UEM: 0.7201, LEM: 0.5261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2971, partial_loss/deprel_loss: 0.2723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4580, loss: 0.4490, batch_reg_loss: 0.1808, reg_loss: 0.1809 ||:  69%|######9   | 66/95 [00:29<00:13,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9711, LAS: 0.9454, UEM: 0.7264, LEM: 0.5341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.2579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4482, loss: 0.4458, batch_reg_loss: 0.1807, reg_loss: 0.1809 ||:  75%|#######4  | 71/95 [00:34<00:14,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9530, UAS: 0.9713, LAS: 0.9456, UEM: 0.7259, LEM: 0.5322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1649, partial_loss/deprel_loss: 0.2355, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4021, loss: 0.4462, batch_reg_loss: 0.1807, reg_loss: 0.1808 ||:  80%|########  | 76/95 [00:36<00:10,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9148, UAS: 0.9706, LAS: 0.9448, UEM: 0.7206, LEM: 0.5273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8308, partial_loss/deprel_loss: 0.4701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7229, loss: 0.4521, batch_reg_loss: 0.1807, reg_loss: 0.1808 ||:  85%|########5 | 81/95 [00:38<00:07,  1.93it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9524, UAS: 0.9705, LAS: 0.9447, UEM: 0.7170, LEM: 0.5219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0917, partial_loss/deprel_loss: 0.2132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3696, loss: 0.4528, batch_reg_loss: 0.1807, reg_loss: 0.1808 ||:  91%|######### | 86/95 [00:40<00:04,  2.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9613, UAS: 0.9710, LAS: 0.9451, UEM: 0.7263, LEM: 0.5314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0982, partial_loss/deprel_loss: 0.1860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3491, loss: 0.4496, batch_reg_loss: 0.1807, reg_loss: 0.1808 ||:  96%|#########5| 91/95 [00:43<00:01,  2.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9379, UAS: 0.9704, LAS: 0.9445, UEM: 0.7170, LEM: 0.5231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5476, partial_loss/deprel_loss: 0.3039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5333, loss: 0.4536, batch_reg_loss: 0.1807, reg_loss: 0.1808 ||: 100%|##########| 95/95 [00:45<00:00,  2.11it/s]\n",
+      "2023-04-07 02:25:47,752 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:25:47,752 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 02:25:47,752 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.181  |       N/A\n",
+      "2023-04-07 02:25:47,752 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - UEM                      |     0.717  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - LEM                      |     0.523  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - EM                       |     0.938  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.548  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - UAS                      |     0.970  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.304  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - loss                     |     0.454  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - LAS                      |     0.945  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:25:47,753 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:25:47,754 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:25:47,754 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:25:47,758 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:25:52,111 - INFO - combo.training.trainer - Epoch duration: 0:00:52.302130\n",
+      "2023-04-07 02:25:52,111 - INFO - combo.training.trainer - Estimated training time remaining: 3:49:38\n",
+      "2023-04-07 02:25:52,112 - INFO - allennlp.training.trainer - Epoch 194/399\n",
+      "2023-04-07 02:25:52,112 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:25:52,112 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:25:52,121 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9784, UAS: 0.9727, LAS: 0.9475, UEM: 0.8671, LEM: 0.7463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0226, partial_loss/deprel_loss: 0.0932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2598, loss: 0.4254, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||:   4%|4         | 4/95 [00:02<00:46,  1.97it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9577, UAS: 0.9729, LAS: 0.9472, UEM: 0.8300, LEM: 0.6810, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0788, partial_loss/deprel_loss: 0.1887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3473, loss: 0.4168, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||:   9%|9         | 9/95 [00:04<00:42,  2.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9737, LAS: 0.9473, UEM: 0.7973, LEM: 0.6318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3108, partial_loss/deprel_loss: 0.3603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5310, loss: 0.4248, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||:  15%|#4        | 14/95 [00:06<00:38,  2.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9531, UAS: 0.9739, LAS: 0.9478, UEM: 0.7835, LEM: 0.6102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1577, partial_loss/deprel_loss: 0.2080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3785, loss: 0.4242, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||:  20%|##        | 19/95 [00:08<00:36,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9668, UAS: 0.9741, LAS: 0.9482, UEM: 0.7857, LEM: 0.6130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0600, partial_loss/deprel_loss: 0.1196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2882, loss: 0.4240, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||:  25%|##5       | 24/95 [00:11<00:34,  2.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9724, LAS: 0.9465, UEM: 0.7654, LEM: 0.5906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6934, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6301, loss: 0.4365, batch_reg_loss: 0.1806, reg_loss: 0.1806 ||:  31%|###       | 29/95 [00:13<00:31,  2.12it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9725, LAS: 0.9466, UEM: 0.7548, LEM: 0.5730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2552, partial_loss/deprel_loss: 0.2985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4704, loss: 0.4383, batch_reg_loss: 0.1805, reg_loss: 0.1806 ||:  37%|###6      | 35/95 [00:15<00:26,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9720, LAS: 0.9462, UEM: 0.7437, LEM: 0.5612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2174, partial_loss/deprel_loss: 0.2386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4149, loss: 0.4398, batch_reg_loss: 0.1805, reg_loss: 0.1806 ||:  42%|####2     | 40/95 [00:18<00:24,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9708, LAS: 0.9450, UEM: 0.7368, LEM: 0.5538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8662, partial_loss/deprel_loss: 0.4060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6785, loss: 0.4482, batch_reg_loss: 0.1805, reg_loss: 0.1806 ||:  47%|####7     | 45/95 [00:20<00:22,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9300, UAS: 0.9700, LAS: 0.9442, UEM: 0.7249, LEM: 0.5406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6876, partial_loss/deprel_loss: 0.3537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6009, loss: 0.4535, batch_reg_loss: 0.1805, reg_loss: 0.1806 ||:  53%|#####2    | 50/95 [00:22<00:19,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9307, UAS: 0.9699, LAS: 0.9442, UEM: 0.7165, LEM: 0.5298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4022, partial_loss/deprel_loss: 0.3170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.4529, batch_reg_loss: 0.1805, reg_loss: 0.1806 ||:  58%|#####7    | 55/95 [00:24<00:17,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9699, LAS: 0.9441, UEM: 0.7215, LEM: 0.5327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6227, partial_loss/deprel_loss: 0.3280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5674, loss: 0.4533, batch_reg_loss: 0.1805, reg_loss: 0.1805 ||:  63%|######3   | 60/95 [00:26<00:15,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9597, UAS: 0.9702, LAS: 0.9444, UEM: 0.7187, LEM: 0.5262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0994, partial_loss/deprel_loss: 0.2168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3737, loss: 0.4522, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||:  68%|######8   | 65/95 [00:28<00:12,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9702, LAS: 0.9444, UEM: 0.7136, LEM: 0.5193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4027, partial_loss/deprel_loss: 0.3527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5431, loss: 0.4520, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||:  74%|#######3  | 70/95 [00:31<00:10,  2.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9702, LAS: 0.9442, UEM: 0.7087, LEM: 0.5118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1623, partial_loss/deprel_loss: 0.2495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4125, loss: 0.4532, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||:  79%|#######8  | 75/95 [00:33<00:08,  2.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9700, LAS: 0.9440, UEM: 0.7087, LEM: 0.5108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1335, partial_loss/deprel_loss: 0.2324, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3931, loss: 0.4542, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||:  84%|########4 | 80/95 [00:35<00:06,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9172, UAS: 0.9700, LAS: 0.9437, UEM: 0.7158, LEM: 0.5179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6074, partial_loss/deprel_loss: 0.3437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5768, loss: 0.4542, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||:  89%|########9 | 85/95 [00:37<00:04,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9704, LAS: 0.9442, UEM: 0.7185, LEM: 0.5193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2901, partial_loss/deprel_loss: 0.2797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4622, loss: 0.4521, batch_reg_loss: 0.1804, reg_loss: 0.1805 ||:  95%|#########4| 90/95 [00:39<00:02,  2.27it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9706, LAS: 0.9443, UEM: 0.7174, LEM: 0.5159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.2301, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3989, loss: 0.4508, batch_reg_loss: 0.1803, reg_loss: 0.1805 ||: 100%|##########| 95/95 [00:42<00:00,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9706, LAS: 0.9443, UEM: 0.7174, LEM: 0.5159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.2301, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3989, loss: 0.4508, batch_reg_loss: 0.1803, reg_loss: 0.1805 ||: 100%|##########| 95/95 [00:42<00:00,  2.26it/s]\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.180  |       N/A\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - UEM                      |     0.717  |       N/A\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - LEM                      |     0.516  |       N/A\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - EM                       |     0.949  |       N/A\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.172  |       N/A\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - UAS                      |     0.971  |       N/A\n",
+      "2023-04-07 02:26:36,884 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.230  |       N/A\n",
+      "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - loss                     |     0.451  |       N/A\n",
+      "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - LAS                      |     0.944  |       N/A\n",
+      "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 02:26:36,885 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 02:26:36,889 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n",
+      "2023-04-07 02:26:41,701 - INFO - combo.training.trainer - Epoch duration: 0:00:49.589770\n",
+      "2023-04-07 02:26:41,702 - INFO - combo.training.trainer - Estimated training time remaining: 3:48:13\n",
+      "2023-04-07 02:26:41,702 - INFO - allennlp.training.trainer - Epoch 195/399\n",
+      "2023-04-07 02:26:41,702 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:26:41,703 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:26:41,710 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9527, UAS: 0.9720, LAS: 0.9488, UEM: 0.6780, LEM: 0.4529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2827, partial_loss/deprel_loss: 0.2622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4466, loss: 0.4437, batch_reg_loss: 0.1803, reg_loss: 0.1803 ||:   5%|5         | 5/95 [00:02<00:38,  2.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9565, UAS: 0.9784, LAS: 0.9557, UEM: 0.8436, LEM: 0.6916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1188, partial_loss/deprel_loss: 0.1871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3538, loss: 0.3926, batch_reg_loss: 0.1803, reg_loss: 0.1803 ||:   9%|9         | 9/95 [00:04<00:38,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9762, LAS: 0.9520, UEM: 0.8126, LEM: 0.6409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.2548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4186, loss: 0.4159, batch_reg_loss: 0.1803, reg_loss: 0.1803 ||:  15%|#4        | 14/95 [00:06<00:36,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9316, UAS: 0.9743, LAS: 0.9495, UEM: 0.7793, LEM: 0.6013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4681, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5294, loss: 0.4299, batch_reg_loss: 0.1803, reg_loss: 0.1803 ||:  20%|##        | 19/95 [00:08<00:34,  2.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9711, LAS: 0.9466, UEM: 0.7379, LEM: 0.5623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2964, partial_loss/deprel_loss: 0.2368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4290, loss: 0.4462, batch_reg_loss: 0.1803, reg_loss: 0.1803 ||:  25%|##5       | 24/95 [00:10<00:31,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9395, UAS: 0.9702, LAS: 0.9454, UEM: 0.7296, LEM: 0.5485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2643, partial_loss/deprel_loss: 0.2978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4713, loss: 0.4505, batch_reg_loss: 0.1802, reg_loss: 0.1803 ||:  31%|###       | 29/95 [00:13<00:29,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9534, UAS: 0.9701, LAS: 0.9452, UEM: 0.7177, LEM: 0.5304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4225, loss: 0.4506, batch_reg_loss: 0.1802, reg_loss: 0.1803 ||:  36%|###5      | 34/95 [00:15<00:26,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9700, LAS: 0.9451, UEM: 0.7127, LEM: 0.5224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4534, partial_loss/deprel_loss: 0.3090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5181, loss: 0.4517, batch_reg_loss: 0.1802, reg_loss: 0.1803 ||:  41%|####1     | 39/95 [00:17<00:24,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9705, LAS: 0.9453, UEM: 0.7117, LEM: 0.5165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2453, partial_loss/deprel_loss: 0.2147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4010, loss: 0.4485, batch_reg_loss: 0.1802, reg_loss: 0.1803 ||:  46%|####6     | 44/95 [00:19<00:22,  2.23it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9692, LAS: 0.9440, UEM: 0.7051, LEM: 0.5115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1320, partial_loss/deprel_loss: 0.1871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3562, loss: 0.4569, batch_reg_loss: 0.1802, reg_loss: 0.1803 ||:  52%|#####1    | 49/95 [00:22<00:21,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9486, UAS: 0.9700, LAS: 0.9451, UEM: 0.7170, LEM: 0.5275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2821, partial_loss/deprel_loss: 0.2490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4358, loss: 0.4512, batch_reg_loss: 0.1802, reg_loss: 0.1802 ||:  57%|#####6    | 54/95 [00:24<00:19,  2.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9483, UAS: 0.9699, LAS: 0.9451, UEM: 0.7076, LEM: 0.5154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3030, partial_loss/deprel_loss: 0.2799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4647, loss: 0.4522, batch_reg_loss: 0.1801, reg_loss: 0.1802 ||:  63%|######3   | 60/95 [00:27<00:15,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9593, UAS: 0.9703, LAS: 0.9453, UEM: 0.7074, LEM: 0.5125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0932, partial_loss/deprel_loss: 0.1992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3581, loss: 0.4512, batch_reg_loss: 0.1801, reg_loss: 0.1802 ||:  68%|######8   | 65/95 [00:29<00:13,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9641, UAS: 0.9701, LAS: 0.9452, UEM: 0.7060, LEM: 0.5122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0897, partial_loss/deprel_loss: 0.1406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3105, loss: 0.4523, batch_reg_loss: 0.1801, reg_loss: 0.1802 ||:  74%|#######3  | 70/95 [00:31<00:10,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9703, LAS: 0.9452, UEM: 0.7059, LEM: 0.5089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3544, partial_loss/deprel_loss: 0.3097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4987, loss: 0.4509, batch_reg_loss: 0.1801, reg_loss: 0.1802 ||:  79%|#######8  | 75/95 [00:33<00:08,  2.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9475, UAS: 0.9696, LAS: 0.9444, UEM: 0.6974, LEM: 0.5001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1896, partial_loss/deprel_loss: 0.2326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4040, loss: 0.4551, batch_reg_loss: 0.1801, reg_loss: 0.1802 ||:  84%|########4 | 80/95 [00:35<00:06,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9699, LAS: 0.9447, UEM: 0.7109, LEM: 0.5164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0795, partial_loss/deprel_loss: 0.1642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3273, loss: 0.4524, batch_reg_loss: 0.1801, reg_loss: 0.1802 ||:  89%|########9 | 85/95 [00:38<00:04,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9697, LAS: 0.9445, UEM: 0.7068, LEM: 0.5130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1100, partial_loss/deprel_loss: 0.2053, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3663, loss: 0.4535, batch_reg_loss: 0.1800, reg_loss: 0.1802 ||:  95%|#########4| 90/95 [00:40<00:02,  2.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9573, UAS: 0.9702, LAS: 0.9449, UEM: 0.7149, LEM: 0.5209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0860, partial_loss/deprel_loss: 0.1579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3235, loss: 0.4497, batch_reg_loss: 0.1800, reg_loss: 0.1802 ||: 100%|##########| 95/95 [00:42<00:00,  2.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9573, UAS: 0.9702, LAS: 0.9449, UEM: 0.7149, LEM: 0.5209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0860, partial_loss/deprel_loss: 0.1579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3235, loss: 0.4497, batch_reg_loss: 0.1800, reg_loss: 0.1802 ||: 100%|##########| 95/95 [00:42<00:00,  2.23it/s]\n",
+      "2023-04-07 02:27:27,488 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/11 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9532, LAS: 0.9049, UEM: 0.6861, LEM: 0.4048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4058, partial_loss/deprel_loss: 6.5936, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3561, loss: 6.3438, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  36%|###6      | 4/11 [00:02<00:04,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9536, LAS: 0.9068, UEM: 0.7453, LEM: 0.5038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5532, partial_loss/deprel_loss: 15.5781, partial_loss/cycle_loss: 0.0000, batch_loss: 12.7731, loss: 6.6323, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  64%|######3   | 7/11 [00:04<00:02,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9531, LAS: 0.9027, UEM: 0.6908, LEM: 0.4182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5501, partial_loss/deprel_loss: 6.8559, partial_loss/cycle_loss: 0.0000, batch_loss: 5.5948, loss: 6.8042, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00,  1.55it/s] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9531, LAS: 0.9027, UEM: 0.6908, LEM: 0.4182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5501, partial_loss/deprel_loss: 6.8559, partial_loss/cycle_loss: 0.0000, batch_loss: 5.5948, loss: 6.8042, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 11/11 [00:07<00:00,  1.54it/s]\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.180  |     0.000\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - UEM                      |     0.715  |     0.691\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - LEM                      |     0.521  |     0.418\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - EM                       |     0.957  |     0.903\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.086  |     0.550\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - UAS                      |     0.970  |     0.953\n",
+      "2023-04-07 02:27:34,645 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6955.898  |       N/A\n",
+      "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.158  |     6.856\n",
+      "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - loss                     |     0.450  |     6.804\n",
+      "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - LAS                      |     0.945  |     0.903\n",
+      "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2426.041  |       N/A\n",
+      "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 02:27:34,646 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 02:27:34,651 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlp867qpopk/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 02:27:38,944 - INFO - combo.training.trainer - Epoch duration: 0:00:57.242174\n",
+      "2023-04-07 02:27:38,945 - INFO - combo.training.trainer - Estimated training time remaining: 3:46:56\n",
+      "2023-04-07 02:27:38,945 - INFO - allennlp.training.trainer - Epoch 196/399\n",
+      "2023-04-07 02:27:38,945 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.8G\n",
+      "2023-04-07 02:27:38,946 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 02:27:38,956 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/95 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9574, UAS: 0.9680, LAS: 0.9432, UEM: 0.6083, LEM: 0.3994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2071, partial_loss/deprel_loss: 0.2123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3913, loss: 0.4754, batch_reg_loss: 0.1800, reg_loss: 0.1800 ||:   5%|5         | 5/95 [00:02<00:41,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9652, LAS: 0.9405, UEM: 0.5337, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5089, partial_loss/deprel_loss: 0.3847, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5895, loss: 0.4913, batch_reg_loss: 0.1800, reg_loss: 0.1800 ||:  11%|#         | 10/95 [00:04<00:38,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9419, UAS: 0.9684, LAS: 0.9435, UEM: 0.6476, LEM: 0.4498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3862, partial_loss/deprel_loss: 0.3155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5096, loss: 0.4663, batch_reg_loss: 0.1800, reg_loss: 0.1800 ||:  16%|#5        | 15/95 [00:06<00:36,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9702, LAS: 0.9457, UEM: 0.7184, LEM: 0.5454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4626, partial_loss/deprel_loss: 0.2818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4979, loss: 0.4515, batch_reg_loss: 0.1800, reg_loss: 0.1800 ||:  20%|##        | 19/95 [00:08<00:36,  2.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9569, UAS: 0.9711, LAS: 0.9459, UEM: 0.7201, LEM: 0.5365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1590, partial_loss/deprel_loss: 0.2219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3893, loss: 0.4462, batch_reg_loss: 0.1799, reg_loss: 0.1800 ||:  25%|##5       | 24/95 [00:10<00:32,  2.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9592, UAS: 0.9717, LAS: 0.9463, UEM: 0.7125, LEM: 0.5195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1199, partial_loss/deprel_loss: 0.1988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3629, loss: 0.4442, batch_reg_loss: 0.1799, reg_loss: 0.1800 ||:  32%|###1      | 30/95 [00:13<00:28,  2.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9511, UAS: 0.9710, LAS: 0.9456, UEM: 0.6994, LEM: 0.5027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2418, partial_loss/deprel_loss: 0.2540, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4315, loss: 0.4491, batch_reg_loss: 0.1799, reg_loss: 0.1800 ||:  38%|###7      | 36/95 [00:15<00:25,  2.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9713, LAS: 0.9459, UEM: 0.7014, LEM: 0.5015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2789, partial_loss/deprel_loss: 0.2864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4648, loss: 0.4461, batch_reg_loss: 0.1799, reg_loss: 0.1800 ||:  43%|####3     | 41/95 [00:17<00:22,  2.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9491, UAS: 0.9716, LAS: 0.9463, UEM: 0.7029, LEM: 0.5023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1904, partial_loss/deprel_loss: 0.2487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4169, loss: 0.4436, batch_reg_loss: 0.1799, reg_loss: 0.1800 ||:  48%|####8     | 46/95 [00:20<00:21,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9721, LAS: 0.9468, UEM: 0.7241, LEM: 0.5305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0812, partial_loss/deprel_loss: 0.1878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3463, loss: 0.4396, batch_reg_loss: 0.1799, reg_loss: 0.1799 ||:  54%|#####3    | 51/95 [00:22<00:19,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9479, UAS: 0.9718, LAS: 0.9463, UEM: 0.7154, LEM: 0.5183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1933, partial_loss/deprel_loss: 0.2721, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4362, loss: 0.4425, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||:  59%|#####8    | 56/95 [00:24<00:16,  2.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9707, LAS: 0.9449, UEM: 0.7084, LEM: 0.5105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8299, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6945, loss: 0.4511, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||:  64%|######4   | 61/95 [00:26<00:15,  2.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9478, UAS: 0.9708, LAS: 0.9450, UEM: 0.7059, LEM: 0.5047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1677, partial_loss/deprel_loss: 0.2619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4229, loss: 0.4509, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||:  69%|######9   | 66/95 [00:28<00:12,  2.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9588, UAS: 0.9704, LAS: 0.9446, UEM: 0.7017, LEM: 0.5009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1216, partial_loss/deprel_loss: 0.2030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3665, loss: 0.4535, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||:  75%|#######4  | 71/95 [00:31<00:10,  2.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9276, UAS: 0.9707, LAS: 0.9448, UEM: 0.7072, LEM: 0.5067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5046, partial_loss/deprel_loss: 0.3261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5416, loss: 0.4516, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||:  80%|########  | 76/95 [00:33<00:08,  2.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9706, LAS: 0.9446, UEM: 0.7021, LEM: 0.5010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4056, partial_loss/deprel_loss: 0.3401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5330, loss: 0.4530, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||:  85%|########5 | 81/95 [00:35<00:06,  2.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9711, LAS: 0.9451, UEM: 0.7149, LEM: 0.5145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1468, partial_loss/deprel_loss: 0.2580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4155, loss: 0.4493, batch_reg_loss: 0.1798, reg_loss: 0.1799 ||:  91%|######### | 86/95 [00:37<00:03,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9708, LAS: 0.9447, UEM: 0.7110, LEM: 0.5093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2038, partial_loss/deprel_loss: 0.2541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4238, loss: 0.4509, batch_reg_loss: 0.1797, reg_loss: 0.1799 ||:  96%|#########5| 91/95 [00:39<00:01,  2.24it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9613, UAS: 0.9712, LAS: 0.9451, UEM: 0.7205, LEM: 0.5204, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0793, partial_loss/deprel_loss: 0.1742, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3349, loss: 0.4479, batch_reg_loss: 0.1797, reg_loss: 0.1799 ||: 100%|##########| 95/95 [00:41<00:00,  2.27it/s]\n",
+      "2023-04-07 02:28:24,033 - INFO - combo.training.trainer - Ran out of patience.  Stopping training.\n",
+      "2023-04-07 02:28:24,034 - INFO - allennlp.training.checkpointer - loading best weights\n",
+      "2023-04-07 02:28:25,595 - INFO - allennlp.common.util - Metrics: {\n",
+      "  \"best_epoch\": 195,\n",
+      "  \"peak_worker_0_memory_MB\": 6955.8984375,\n",
+      "  \"peak_gpu_0_memory_MB\": 2426.04052734375,\n",
+      "  \"training_duration\": \"3:37:58.447135\",\n",
+      "  \"training_start_epoch\": 0,\n",
+      "  \"training_epochs\": 195,\n",
+      "  \"epoch\": 195,\n",
+      "  \"training_UPOS_ACC\": 0.0,\n",
+      "  \"training_XPOS_ACC\": 0.0,\n",
+      "  \"training_SEMREL_ACC\": 0.0,\n",
+      "  \"training_LEMMA_ACC\": 0.0,\n",
+      "  \"training_FEATS_ACC\": 0.0,\n",
+      "  \"training_EM\": 0.9572854042053223,\n",
+      "  \"training_UAS\": 0.9701954834274984,\n",
+      "  \"training_LAS\": 0.9448924505842707,\n",
+      "  \"training_UEM\": 0.7148521082441788,\n",
+      "  \"training_LEM\": 0.5208936438011328,\n",
+      "  \"training_EUAS\": 0.0,\n",
+      "  \"training_ELAS\": 0.0,\n",
+      "  \"training_EUEM\": 0.0,\n",
+      "  \"training_ELEM\": 0.0,\n",
+      "  \"training_partial_loss/head_loss\": 0.08596646785736084,\n",
+      "  \"training_partial_loss/deprel_loss\": 0.15788140892982483,\n",
+      "  \"training_partial_loss/cycle_loss\": 0.0,\n",
+      "  \"training_loss\": 0.4496598549579319,\n",
+      "  \"training_reg_loss\": 0.18018160729031812,\n",
+      "  \"training_worker_0_memory_MB\": 6955.8984375,\n",
+      "  \"training_gpu_0_memory_MB\": 2426.04052734375,\n",
+      "  \"training_patience\": 1,\n",
+      "  \"validation_UPOS_ACC\": 0.0,\n",
+      "  \"validation_XPOS_ACC\": 0.0,\n",
+      "  \"validation_SEMREL_ACC\": 0.0,\n",
+      "  \"validation_LEMMA_ACC\": 0.0,\n",
+      "  \"validation_FEATS_ACC\": 0.0,\n",
+      "  \"validation_EM\": 0.9029048681259155,\n",
+      "  \"validation_UAS\": 0.9531431054461182,\n",
+      "  \"validation_LAS\": 0.9027375434530707,\n",
+      "  \"validation_UEM\": 0.690843621399177,\n",
+      "  \"validation_LEM\": 0.4182098765432099,\n",
+      "  \"validation_EUAS\": 0.0,\n",
+      "  \"validation_ELAS\": 0.0,\n",
+      "  \"validation_EUEM\": 0.0,\n",
+      "  \"validation_ELEM\": 0.0,\n",
+      "  \"validation_partial_loss/head_loss\": 0.5501478910446167,\n",
+      "  \"validation_partial_loss/deprel_loss\": 6.855911731719971,\n",
+      "  \"validation_partial_loss/cycle_loss\": 0.0,\n",
+      "  \"validation_loss\": 6.80415695363825,\n",
+      "  \"validation_reg_loss\": 0.0,\n",
+      "  \"best_validation_UPOS_ACC\": 0.0,\n",
+      "  \"best_validation_XPOS_ACC\": 0.0,\n",
+      "  \"best_validation_SEMREL_ACC\": 0.0,\n",
+      "  \"best_validation_LEMMA_ACC\": 0.0,\n",
+      "  \"best_validation_FEATS_ACC\": 0.0,\n",
+      "  \"best_validation_EM\": 0.9029048681259155,\n",
+      "  \"best_validation_UAS\": 0.9531431054461182,\n",
+      "  \"best_validation_LAS\": 0.9027375434530707,\n",
+      "  \"best_validation_UEM\": 0.690843621399177,\n",
+      "  \"best_validation_LEM\": 0.4182098765432099,\n",
+      "  \"best_validation_EUAS\": 0.0,\n",
+      "  \"best_validation_ELAS\": 0.0,\n",
+      "  \"best_validation_EUEM\": 0.0,\n",
+      "  \"best_validation_ELEM\": 0.0,\n",
+      "  \"best_validation_partial_loss/head_loss\": 0.5501478910446167,\n",
+      "  \"best_validation_partial_loss/deprel_loss\": 6.855911731719971,\n",
+      "  \"best_validation_partial_loss/cycle_loss\": 0.0,\n",
+      "  \"best_validation_loss\": 6.80415695363825,\n",
+      "  \"best_validation_reg_loss\": 0.0\n",
+      "}\n",
+      "2023-04-07 02:28:25,596 - INFO - allennlp.models.archival - archiving weights and vocabulary to ./allennlp867qpopk/model.tar.gz\n",
+      "2023-04-07 02:40:44,065 - INFO - combo.main - Training model stored in: ./allennlp867qpopk\n"
+     ]
+    }
+   ],
+   "source": [
+    "! {COMBO} --mode train \\\n",
+    "    --training_data_path connlu/pdbc-cont-train.conllu \\\n",
+    "    --validation_data_path connlu/pdbc-cont-validation.conllu \\\n",
+    "    --cuda_device 0 \\\n",
+    "    --pretrained_transformer_name allegro/herbert-large-cased \\\n",
+    "    --targets head,deprel \\\n",
+    "    --serialization_dir ."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "74363e00",
+   "metadata": {},
+   "source": [
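+    "In the cell below, replace `allennlp867qpopk` with the name of the `allennlp...` directory produced by your COMBO run (it is reported in the last line of the training log above, after `Training model stored in:`)."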
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "ae258726",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "! rm -r model-pdbc-cont/\n",
+    "! mv allennlp867qpopk/ model-pdbc-cont/"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "combo_python39",
+   "language": "python",
+   "name": "combo_python39"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.16"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git b/COMBO/TrainModel.ipynb a/COMBO/TrainModel.ipynb
new file mode 100644
index 0000000..f327a58
--- /dev/null
+++ a/COMBO/TrainModel.ipynb
@@ -0,0 +1,11222 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "aabfb24b",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "COMBO = '/home/kkrasnowska/anaconda3/envs/combo_p39/bin/combo'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "54a97ebd",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "I0406 22:49:19.084177 139884283720768 params.py:248] include_in_archive = None\n",
+      "2023-04-06 22:49:19,085 - INFO - allennlp.common.params - random_seed = 8787\n",
+      "2023-04-06 22:49:19,085 - INFO - allennlp.common.params - numpy_seed = 8787\n",
+      "2023-04-06 22:49:19,085 - INFO - allennlp.common.params - pytorch_seed = 8787\n",
+      "2023-04-06 22:49:19,086 - INFO - allennlp.common.checks - Pytorch version: 1.13.1\n",
+      "2023-04-06 22:49:19,087 - INFO - allennlp.common.params - type = default\n",
+      "2023-04-06 22:49:19,087 - INFO - allennlp.common.params - dataset_reader.type = conllu\n",
+      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.lazy = False\n",
+      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.cache_directory = None\n",
+      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.max_instances = None\n",
+      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.manual_distributed_sharding = False\n",
+      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.manual_multi_process_sharding = False\n",
+      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.type = characters_const_padding\n",
+      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.namespace = token_characters\n",
+      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.start_tokens = None\n",
+      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.end_tokens = None\n",
+      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.min_padding_length = 32\n",
+      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.type = feats_indexer\n",
+      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.namespace = feats\n",
+      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.feature_name = feats_\n",
+      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.type = characters_const_padding\n",
+      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.namespace = token_characters\n",
+      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n",
+      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n",
+      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n",
+      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n",
+      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.start_tokens = None\n",
+      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.end_tokens = None\n",
+      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.min_padding_length = 32\n",
+      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n",
+      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n",
+      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.namespace = tags\n",
+      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.max_length = None\n",
+      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n",
+      "2023-04-06 22:49:21,857 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.type = single_id\n",
+      "2023-04-06 22:49:21,857 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.namespace = upostag\n",
+      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.lowercase_tokens = False\n",
+      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.start_tokens = None\n",
+      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.end_tokens = None\n",
+      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.feature_name = pos_\n",
+      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.type = single_id\n",
+      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.namespace = xpostag\n",
+      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n",
+      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.start_tokens = None\n",
+      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.end_tokens = None\n",
+      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.feature_name = tag_\n",
+      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
+      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.type = characters_const_padding\n",
+      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.namespace = lemma_characters\n",
+      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n",
+      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n",
+      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
+      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
+      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.start_tokens = None\n",
+      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.end_tokens = None\n",
+      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.min_padding_length = 32\n",
+      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n",
+      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.features = ['token', 'char']\n",
+      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.targets = ['head', 'deprel']\n",
+      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.use_sem = False\n",
+      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - train_data_path = connlu/pdbc-train.conllu\n",
+      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - datasets_for_vocab_creation = ['train']\n",
+      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - validation_dataset_reader = None\n",
+      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - validation_data_path = connlu/pdbc-validation.conllu\n",
+      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - validation_data_loader = None\n",
+      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - test_data_path = None\n",
+      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - evaluate_on_test = False\n",
+      "2023-04-06 22:49:21,862 - INFO - allennlp.common.params - batch_weight_key = \n",
+      "2023-04-06 22:49:21,862 - INFO - allennlp.training.util - Reading training data from connlu/pdbc-train.conllu\n",
+      "reading instances: 0it [00:00, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "reading instances: 3853it [00:02, 1926.46it/s]\n",
+      "reading instances: 8024it [00:04, 1907.69it/s]\n",
+      "reading instances: 11424it [00:06, 1840.15it/s]\n",
+      "reading instances: 14555it [00:08, 1654.52it/s]\n",
+      "reading instances: 17659it [00:09, 1772.69it/s]\n",
+      "2023-04-06 22:49:31,824 - INFO - allennlp.training.util - Reading validation data from connlu/pdbc-validation.conllu\n",
+      "reading instances: 0it [00:00, ?it/s]\n",
+      "reading instances: 1851it [00:02, 897.46it/s]\n",
+      "reading instances: 2211it [00:02, 933.13it/s]\n",
+      "2023-04-06 22:49:34,194 - INFO - allennlp.commands.train - From dataset instances, train will be considered for vocabulary creation.\n",
+      "2023-04-06 22:49:34,194 - INFO - allennlp.common.params - vocabulary.type = from_instances_extended\n",
+      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.min_count = None\n",
+      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.max_vocab_size = None\n",
+      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.non_padded_namespaces = ['head_labels']\n",
+      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.pretrained_files = None\n",
+      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.only_include_pretrained_words = True\n",
+      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.min_pretrained_embeddings = None\n",
+      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.padding_token = __PAD__\n",
+      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.oov_token = _\n",
+      "2023-04-06 22:49:34,195 - INFO - allennlp.data.vocabulary - Fitting token dictionary from dataset.\n",
+      "building vocab: 0it [00:00, ?it/s]\n",
+      "building vocab: 16773it [00:02, 8386.16it/s]\n",
+      "building vocab: 17659it [00:02, 8423.42it/s]\n",
+      "2023-04-06 22:49:36,293 - INFO - allennlp.common.params - model.type = semantic_multitask\n",
+      "2023-04-06 22:49:36,293 - INFO - allennlp.common.params - model.text_field_embedder.type = basic\n",
+      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n",
+      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.embedding_dim = 64\n",
+      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n",
+      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n",
+      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n",
+      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n",
+      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n",
+      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n",
+      "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n",
+      "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - type = relu\n",
+      "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - type = relu\n",
+      "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - type = linear\n",
+      "2023-04-06 22:49:36,300 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n",
+      "2023-04-06 22:49:36,300 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n",
+      "2023-04-06 22:49:36,300 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n",
+      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_dim = 100\n",
+      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f388b745280>\n",
+      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n",
+      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.freeze_transformer = True\n",
+      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.last_layer_only = True\n",
+      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n",
+      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n",
+      "2023-04-06 22:49:44,104 - INFO - allennlp.common.params - model.seq_encoder.type = combo_encoder\n",
+      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.input_size = 164\n",
+      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.hidden_size = 512\n",
+      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.num_layers = 2\n",
+      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n",
+      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n",
+      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.use_highway = False\n",
+      "2023-04-06 22:49:44,804 - INFO - allennlp.common.params - model.seq_encoder.layer_dropout_probability = 0.33\n",
+      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.use_sample_weight = True\n",
+      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.lemmatizer = None\n",
+      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.upos_tagger = None\n",
+      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.xpos_tagger = None\n",
+      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.semantic_relation = None\n",
+      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.morphological_feat = None\n",
+      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.dependency_relation.type = combo_dependency_parsing_from_vocab\n",
+      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.vocab_namespace = deprel_labels\n",
+      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n",
+      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n",
+      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n",
+      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - type = tanh\n",
+      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n",
+      "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n",
+      "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n",
+      "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n",
+      "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - type = tanh\n",
+      "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n",
+      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.cycle_loss_n = 0\n",
+      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.in_features = 1024\n",
+      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.out_features = 128\n",
+      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.activation = tanh\n",
+      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - type = tanh\n",
+      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n",
+      "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.in_features = 1024\n",
+      "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.out_features = 128\n",
+      "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.activation = tanh\n",
+      "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - type = tanh\n",
+      "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n",
+      "2023-04-06 22:49:44,820 - INFO - allennlp.common.params - model.enhanced_dependency_relation = None\n",
+      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.0.1.type = l2\n",
+      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.0.1.alpha = 1e-06\n",
+      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.1.1.type = l2\n",
+      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.1.1.alpha = 1e-06\n",
+      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.2.1.type = l2\n",
+      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.2.1.alpha = 1e-06\n",
+      "2023-04-06 22:49:44,822 - INFO - allennlp.common.params - model.regularizer.regexes.3.1.type = l2\n",
+      "2023-04-06 22:49:44,822 - INFO - allennlp.common.params - model.regularizer.regexes.3.1.alpha = 1e-05\n",
+      "2023-04-06 22:49:44,822 - INFO - filelock - Lock 139878665944848 acquired on ./allennlpru3hb8qq/vocabulary/.lock\n",
+      "2023-04-06 22:49:44,823 - INFO - filelock - Lock 139878665944848 released on ./allennlpru3hb8qq/vocabulary/.lock\n",
+      "2023-04-06 22:49:44,823 - INFO - allennlp.common.params - data_loader.type = pytorch_dataloader\n",
+      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.batch_size = 1\n",
+      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.shuffle = False\n",
+      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.sampler = None\n",
+      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.num_workers = 0\n",
+      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.pin_memory = False\n",
+      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.drop_last = False\n",
+      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.timeout = 0\n",
+      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.worker_init_fn = None\n",
+      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.multiprocessing_context = None\n",
+      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.batches_per_epoch = None\n",
+      "2023-04-06 22:49:44,825 - INFO - allennlp.common.params - data_loader.batch_sampler.type = token_count\n",
+      "2023-04-06 22:49:44,825 - INFO - allennlp.common.params - data_loader.batch_sampler.word_batch_size = 2500\n",
+      "2023-04-06 22:49:44,825 - INFO - allennlp.common.params - data_loader.batch_sampler.shuffle_dataset = True\n",
+      "/home/kkrasnowska/anaconda3/envs/combo_p39/lib/python3.8/site-packages/combo/data/samplers/samplers.py:51: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n",
+      "  self.batch_dataset = np.array(self.batch_dataset)[indices].tolist()\n",
+      "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.type = pytorch_dataloader\n",
+      "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.batch_size = 1\n",
+      "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.shuffle = False\n",
+      "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.sampler = None\n",
+      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.num_workers = 0\n",
+      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.pin_memory = False\n",
+      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.drop_last = False\n",
+      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.timeout = 0\n",
+      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.worker_init_fn = None\n",
+      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.multiprocessing_context = None\n",
+      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batches_per_epoch = None\n",
+      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batch_sampler.type = token_count\n",
+      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batch_sampler.word_batch_size = 2500\n",
+      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batch_sampler.shuffle_dataset = True\n",
+      "2023-04-06 22:49:44,849 - INFO - allennlp.common.params - trainer.type = gradient_descent_validate_n\n",
+      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.patience = 1\n",
+      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.validation_metric = +EM\n",
+      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.num_epochs = 400\n",
+      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.cuda_device = 0\n",
+      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.grad_norm = None\n",
+      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.grad_clipping = 5\n",
+      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.distributed = None\n",
+      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.world_size = 1\n",
+      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.num_gradient_accumulation_steps = 1\n",
+      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.use_amp = False\n",
+      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.no_grad = None\n",
+      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.momentum_scheduler = None\n",
+      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.tensorboard_writer = None\n",
+      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.moving_average = None\n",
+      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.batch_callbacks = None\n",
+      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.epoch_callbacks.0.type = transfer_patience\n",
+      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.end_callbacks = None\n",
+      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.trainer_callbacks = None\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.type = adam\r\n",
+      "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.parameter_groups = None\r\n",
+      "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.lr = 0.002\r\n",
+      "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.betas = [0.9, 0.9]\r\n",
+      "2023-04-06 22:49:47,278 - INFO - allennlp.common.params - trainer.optimizer.eps = 1e-08\r\n",
+      "2023-04-06 22:49:47,278 - INFO - allennlp.common.params - trainer.optimizer.weight_decay = 0.0\r\n",
+      "2023-04-06 22:49:47,278 - INFO - allennlp.common.params - trainer.optimizer.amsgrad = False\r\n",
+      "2023-04-06 22:49:47,278 - INFO - allennlp.training.optimizers - Number of trainable parameters: 11053872\r\n",
+      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - The following parameters are Frozen (without gradient):\r\n",
+      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.word_embeddings.weight\r\n",
+      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.position_embeddings.weight\r\n",
+      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.token_type_embeddings.weight\r\n",
+      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.query.weight\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.query.bias\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.key.weight\r\n",
+      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.key.bias\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.value.weight\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.value.bias\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.intermediate.dense.weight\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.intermediate.dense.bias\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.dense.weight\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.dense.bias\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.LayerNorm.weight\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.LayerNorm.bias\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.pooler.dense.weight\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.pooler.dense.bias\r\n",
+      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - The following parameters are Tunable (with gradient):\r\n",
+      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - _head_sentinel\r\n",
+      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.char_embed.weight\r\n",
+      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.0.weight\r\n",
+      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.0.bias\r\n",
+      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.1.weight\r\n",
+      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.1.bias\r\n",
+      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.2.weight\r\n",
+      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.2.bias\r\n",
+      "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token.projection_layer.weight\r\n",
+      "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token.projection_layer.bias\r\n",
+      "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.input_linearity.weight\r\n",
+      "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.state_linearity.weight\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.state_linearity.bias\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.input_linearity.weight\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.state_linearity.weight\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.state_linearity.bias\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.input_linearity.weight\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.state_linearity.weight\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.state_linearity.bias\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.input_linearity.weight\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.state_linearity.weight\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.state_linearity.bias\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.head_projection_layer.weight\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.head_projection_layer.bias\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.dependency_projection_layer.weight\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.dependency_projection_layer.bias\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_projection_layer.weight\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_projection_layer.bias\r\n",
+      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.dependency_projection_layer.weight\r\n",
+      "2023-04-06 22:49:47,305 - INFO - allennlp.common.util - dependency_relation.dependency_projection_layer.bias\r\n",
+      "2023-04-06 22:49:47,305 - INFO - allennlp.common.util - dependency_relation.relation_prediction_layer.weight\r\n",
+      "2023-04-06 22:49:47,305 - INFO - allennlp.common.util - dependency_relation.relation_prediction_layer.bias\r\n",
+      "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.type = combo_scheduler\r\n",
+      "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.patience = 6\r\n",
+      "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.decreases = 2\r\n",
+      "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.threshold = 0.001\r\n",
+      "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.checkpointer.type = finishing_only_checkpointer\r\n",
+      "2023-04-06 22:49:47,306 - INFO - allennlp.common.params - trainer.checkpointer.keep_serialized_model_every_num_seconds = None\r\n",
+      "2023-04-06 22:49:47,306 - INFO - allennlp.common.params - trainer.checkpointer.num_serialized_models_to_keep = 2\r\n",
+      "2023-04-06 22:49:47,306 - INFO - allennlp.common.params - trainer.checkpointer.model_save_interval = None\r\n",
+      "2023-04-06 22:49:47,308 - INFO - combo.training.trainer - Beginning training.\r\n",
+      "2023-04-06 22:49:47,308 - INFO - allennlp.training.trainer - Epoch 0/399\r\n",
+      "2023-04-06 22:49:47,308 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.3G\r\n",
+      "2023-04-06 22:49:47,308 - INFO - allennlp.training.trainer - GPU 0 memory usage: 1.4G\r\n",
+      "2023-04-06 22:49:47,315 - INFO - allennlp.training.trainer - Training\r\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\r\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0000, UAS: 0.0492, LAS: 0.0000, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.7155, partial_loss/deprel_loss: 12.9573, partial_loss/cycle_loss: 0.0000, batch_loss: 12.4107, loss: 12.4107, batch_reg_loss: 0.1018, reg_loss: 0.1018 ||:   1%|          | 1/111 [00:03<07:00,  3.82s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0000, UAS: 0.0559, LAS: 0.0045, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 19.7004, partial_loss/deprel_loss: 16.3879, partial_loss/cycle_loss: 0.0000, batch_loss: 17.1516, loss: 25.2089, batch_reg_loss: 0.1012, reg_loss: 0.1015 ||:   4%|3         | 4/111 [00:06<05:11,  2.91s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0120, UAS: 0.0714, LAS: 0.0044, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 22.1129, partial_loss/deprel_loss: 9.0855, partial_loss/cycle_loss: 0.0000, batch_loss: 11.7916, loss: 24.6851, batch_reg_loss: 0.1006, reg_loss: 0.1012 ||:   6%|6         | 7/111 [00:08<03:56,  2.27s/it] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0099, UAS: 0.0608, LAS: 0.0046, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 15.5869, partial_loss/deprel_loss: 9.3639, partial_loss/cycle_loss: 0.0000, batch_loss: 10.7085, loss: 21.3806, batch_reg_loss: 0.1000, reg_loss: 0.1009 ||:   9%|9         | 10/111 [00:10<03:01,  1.80s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0315, UAS: 0.0725, LAS: 0.0092, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 18.3275, partial_loss/deprel_loss: 7.1568, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4905, loss: 18.5717, batch_reg_loss: 0.0995, reg_loss: 0.1006 ||:  12%|#1        | 13/111 [00:12<02:26,  1.49s/it] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0000, UAS: 0.0633, LAS: 0.0083, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 25.8989, partial_loss/deprel_loss: 11.7684, partial_loss/cycle_loss: 0.0000, batch_loss: 14.6935, loss: 17.9697, batch_reg_loss: 0.0991, reg_loss: 0.1003 ||:  14%|#4        | 16/111 [00:15<01:59,  1.26s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0064, UAS: 0.0604, LAS: 0.0079, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 16.1143, partial_loss/deprel_loss: 10.8376, partial_loss/cycle_loss: 0.0000, batch_loss: 11.9915, loss: 16.8737, batch_reg_loss: 0.0986, reg_loss: 0.1001 ||:  17%|#7        | 19/111 [00:17<01:39,  1.08s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0079, UAS: 0.0579, LAS: 0.0081, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 15.2368, partial_loss/deprel_loss: 10.3155, partial_loss/cycle_loss: 0.0000, batch_loss: 11.3978, loss: 16.0851, batch_reg_loss: 0.0981, reg_loss: 0.0998 ||:  20%|#9        | 22/111 [00:19<01:25,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0259, UAS: 0.0602, LAS: 0.0091, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 13.9253, partial_loss/deprel_loss: 7.4326, partial_loss/cycle_loss: 0.0000, batch_loss: 8.8288, loss: 15.3859, batch_reg_loss: 0.0976, reg_loss: 0.0996 ||:  23%|##2       | 25/111 [00:21<01:17,  1.11it/s]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0267, UAS: 0.0629, LAS: 0.0101, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 23.9539, partial_loss/deprel_loss: 6.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 10.0631, loss: 14.9031, batch_reg_loss: 0.0971, reg_loss: 0.0994 ||:  25%|##5       | 28/111 [00:23<01:10,  1.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0139, UAS: 0.0629, LAS: 0.0103, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 19.2664, partial_loss/deprel_loss: 8.1915, partial_loss/cycle_loss: 0.0000, batch_loss: 10.5031, loss: 14.5860, batch_reg_loss: 0.0966, reg_loss: 0.0991 ||:  28%|##7       | 31/111 [00:25<01:04,  1.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0056, UAS: 0.0635, LAS: 0.0105, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 14.2399, partial_loss/deprel_loss: 9.7935, partial_loss/cycle_loss: 0.0000, batch_loss: 10.7789, loss: 14.1692, batch_reg_loss: 0.0961, reg_loss: 0.0989 ||:  31%|###       | 34/111 [00:27<01:00,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0148, UAS: 0.0660, LAS: 0.0107, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.0003, partial_loss/deprel_loss: 6.0032, partial_loss/cycle_loss: 0.0000, batch_loss: 6.4982, loss: 13.6788, batch_reg_loss: 0.0956, reg_loss: 0.0986 ||:  33%|###3      | 37/111 [00:30<00:58,  1.26it/s]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0159, UAS: 0.0717, LAS: 0.0140, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.5919, partial_loss/deprel_loss: 8.8836, partial_loss/cycle_loss: 0.0000, batch_loss: 9.3203, loss: 13.2278, batch_reg_loss: 0.0950, reg_loss: 0.0983 ||:  36%|###6      | 40/111 [00:32<00:58,  1.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0160, UAS: 0.0744, LAS: 0.0148, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.1016, partial_loss/deprel_loss: 9.2769, partial_loss/cycle_loss: 0.0000, batch_loss: 9.5363, loss: 12.8973, batch_reg_loss: 0.0945, reg_loss: 0.0981 ||:  39%|###8      | 43/111 [00:34<00:52,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0467, UAS: 0.0768, LAS: 0.0156, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8362, partial_loss/deprel_loss: 6.5938, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5361, loss: 12.5863, batch_reg_loss: 0.0939, reg_loss: 0.0978 ||:  41%|####1     | 46/111 [00:37<00:49,  1.31it/s] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0130, UAS: 0.0790, LAS: 0.0162, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 12.9970, partial_loss/deprel_loss: 11.0561, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5376, loss: 12.3941, batch_reg_loss: 0.0933, reg_loss: 0.0976 ||:  44%|####4     | 49/111 [00:39<00:46,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0044, UAS: 0.0785, LAS: 0.0158, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 14.6006, partial_loss/deprel_loss: 11.6897, partial_loss/cycle_loss: 0.0000, batch_loss: 12.3646, loss: 12.3354, batch_reg_loss: 0.0927, reg_loss: 0.0973 ||:  47%|####6     | 52/111 [00:41<00:43,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0115, UAS: 0.0791, LAS: 0.0156, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 12.7207, partial_loss/deprel_loss: 11.0801, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5003, loss: 12.2236, batch_reg_loss: 0.0921, reg_loss: 0.0970 ||:  50%|####9     | 55/111 [00:43<00:42,  1.32it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0243, UAS: 0.0817, LAS: 0.0158, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.6552, partial_loss/deprel_loss: 7.4151, partial_loss/cycle_loss: 0.0000, batch_loss: 7.3545, loss: 12.0074, batch_reg_loss: 0.0915, reg_loss: 0.0967 ||:  52%|#####2    | 58/111 [00:45<00:38,  1.36it/s]   \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0191, UAS: 0.0860, LAS: 0.0174, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 11.0116, partial_loss/deprel_loss: 10.2631, partial_loss/cycle_loss: 0.0000, batch_loss: 10.5036, loss: 11.7766, batch_reg_loss: 0.0908, reg_loss: 0.0965 ||:  55%|#####4    | 61/111 [00:48<00:38,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0343, UAS: 0.0937, LAS: 0.0194, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.9906, partial_loss/deprel_loss: 8.5044, partial_loss/cycle_loss: 0.0000, batch_loss: 8.4916, loss: 11.4687, batch_reg_loss: 0.0900, reg_loss: 0.0961 ||:  59%|#####8    | 65/111 [00:50<00:33,  1.38it/s]   \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0919, UAS: 0.0972, LAS: 0.0205, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.0429, partial_loss/deprel_loss: 5.5430, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3323, loss: 11.3481, batch_reg_loss: 0.0893, reg_loss: 0.0958 ||:  61%|######1   | 68/111 [00:53<00:33,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0574, UAS: 0.1052, LAS: 0.0221, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.5849, partial_loss/deprel_loss: 6.9327, partial_loss/cycle_loss: 0.0000, batch_loss: 6.7516, loss: 11.1225, batch_reg_loss: 0.0885, reg_loss: 0.0954 ||:  65%|######4   | 72/111 [00:56<00:28,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0301, UAS: 0.1099, LAS: 0.0231, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.2882, partial_loss/deprel_loss: 9.4010, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4663, loss: 10.9824, batch_reg_loss: 0.0878, reg_loss: 0.0951 ||:  68%|######7   | 75/111 [01:00<00:33,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0518, UAS: 0.1162, LAS: 0.0250, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.7446, partial_loss/deprel_loss: 8.7894, partial_loss/cycle_loss: 0.0000, batch_loss: 8.6676, loss: 10.8571, batch_reg_loss: 0.0872, reg_loss: 0.0948 ||:  70%|#######   | 78/111 [01:02<00:29,  1.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0834, UAS: 0.1219, LAS: 0.0265, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8250, partial_loss/deprel_loss: 7.3410, partial_loss/cycle_loss: 0.0000, batch_loss: 7.1244, loss: 10.7374, batch_reg_loss: 0.0866, reg_loss: 0.0945 ||:  73%|#######2  | 81/111 [01:04<00:24,  1.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0427, UAS: 0.1239, LAS: 0.0269, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.8399, partial_loss/deprel_loss: 10.0552, partial_loss/cycle_loss: 0.0000, batch_loss: 10.2981, loss: 10.7271, batch_reg_loss: 0.0860, reg_loss: 0.0942 ||:  76%|#######5  | 84/111 [01:07<00:22,  1.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0643, UAS: 0.1288, LAS: 0.0287, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.8981, partial_loss/deprel_loss: 9.3547, partial_loss/cycle_loss: 0.0000, batch_loss: 9.5488, loss: 10.6448, batch_reg_loss: 0.0854, reg_loss: 0.0939 ||:  78%|#######8  | 87/111 [01:09<00:19,  1.24it/s]   \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0661, UAS: 0.1356, LAS: 0.0319, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.0897, partial_loss/deprel_loss: 9.0732, partial_loss/cycle_loss: 0.0000, batch_loss: 9.1614, loss: 10.5082, batch_reg_loss: 0.0849, reg_loss: 0.0936 ||:  81%|########1 | 90/111 [01:12<00:17,  1.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0714, UAS: 0.1426, LAS: 0.0350, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.3305, partial_loss/deprel_loss: 8.5479, partial_loss/cycle_loss: 0.0000, batch_loss: 8.5886, loss: 10.3707, batch_reg_loss: 0.0842, reg_loss: 0.0932 ||:  85%|########4 | 94/111 [01:14<00:12,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0987, UAS: 0.1504, LAS: 0.0398, UEM: 0.0005, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8474, partial_loss/deprel_loss: 6.8979, partial_loss/cycle_loss: 0.0000, batch_loss: 6.7715, loss: 10.2165, batch_reg_loss: 0.0837, reg_loss: 0.0929 ||:  87%|########7 | 97/111 [01:17<00:10,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0733, UAS: 0.1541, LAS: 0.0412, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.9606, partial_loss/deprel_loss: 9.1819, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4208, loss: 10.1551, batch_reg_loss: 0.0831, reg_loss: 0.0927 ||:  90%|######### | 100/111 [01:19<00:08,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0887, UAS: 0.1585, LAS: 0.0433, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.6073, partial_loss/deprel_loss: 8.5581, partial_loss/cycle_loss: 0.0000, batch_loss: 8.6506, loss: 10.0863, batch_reg_loss: 0.0826, reg_loss: 0.0924 ||:  93%|#########2| 103/111 [01:21<00:06,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0763, UAS: 0.1650, LAS: 0.0476, UEM: 0.0015, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.8387, partial_loss/deprel_loss: 8.8138, partial_loss/cycle_loss: 0.0000, batch_loss: 9.1009, loss: 9.9700, batch_reg_loss: 0.0821, reg_loss: 0.0921 ||:  95%|#########5| 106/111 [01:24<00:04,  1.15it/s] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1713, UAS: 0.1692, LAS: 0.0496, UEM: 0.0014, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5725, partial_loss/deprel_loss: 5.1460, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1130, loss: 9.8781, batch_reg_loss: 0.0817, reg_loss: 0.0918 ||:  98%|#########8| 109/111 [01:27<00:01,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1029, UAS: 0.1708, LAS: 0.0502, UEM: 0.0014, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.0519, partial_loss/deprel_loss: 7.4492, partial_loss/cycle_loss: 0.0000, batch_loss: 7.4511, loss: 9.8521, batch_reg_loss: 0.0813, reg_loss: 0.0916 ||: 100%|##########| 111/111 [01:28<00:00,  1.25it/s]\n",
+      "2023-04-06 22:51:15,927 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1167, UAS: 0.3116, LAS: 0.1456, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.9999, partial_loss/deprel_loss: 15.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 13.8275, loss: 12.0213, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:12,  1.11s/it]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2614, UAS: 0.3885, LAS: 0.1921, UEM: 0.0012, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.7361, partial_loss/deprel_loss: 8.9365, partial_loss/cycle_loss: 0.0000, batch_loss: 7.8964, loss: 10.3315, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  31%|###       | 4/13 [00:04<00:10,  1.15s/it]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1863, UAS: 0.3556, LAS: 0.1713, UEM: 0.0009, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.5918, partial_loss/deprel_loss: 8.8550, partial_loss/cycle_loss: 0.0000, batch_loss: 8.2024, loss: 11.6787, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:07<00:08,  1.17s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1274, UAS: 0.3363, LAS: 0.1580, UEM: 0.0008, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.5021, partial_loss/deprel_loss: 14.9977, partial_loss/cycle_loss: 0.0000, batch_loss: 13.4986, loss: 12.1599, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:09<00:05,  1.17s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0952, UAS: 0.3134, LAS: 0.1427, UEM: 0.0007, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.8305, partial_loss/deprel_loss: 17.7009, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9268, loss: 13.2406, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:12<00:03,  1.20s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3824, UAS: 0.3342, LAS: 0.1583, UEM: 0.0460, LEM: 0.0089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2575, partial_loss/deprel_loss: 6.4260, partial_loss/cycle_loss: 0.0000, batch_loss: 5.5923, loss: 12.9753, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:14<00:01,  1.20s/it]  \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1377, UAS: 0.3324, LAS: 0.1568, UEM: 0.0427, LEM: 0.0083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.7160, partial_loss/deprel_loss: 11.9092, partial_loss/cycle_loss: 0.0000, batch_loss: 10.8705, loss: 12.8134, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:15<00:00,  1.18s/it]\n",
+      "2023-04-06 22:51:31,252 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     7.449  |    11.909\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     7.052  |     6.716\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.092  |     0.000\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - UEM                      |     0.001  |     0.043\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - LAS                      |     0.050  |     0.157\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - loss                     |     9.852  |    12.813\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  1397.911  |       N/A\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - LEM                      |     0.000  |     0.008\n",
+      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - UAS                      |     0.171  |     0.332\n",
+      "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - EM                       |     0.103  |     0.138\n",
+      "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6486.516  |       N/A\n",
+      "2023-04-06 22:51:31,254 - INFO - combo.training.trainer - Epoch duration: 0:01:43.946313\n",
+      "2023-04-06 22:51:31,254 - INFO - combo.training.trainer - Estimated training time remaining: 11:31:14\n",
+      "2023-04-06 22:51:31,254 - INFO - allennlp.training.trainer - Epoch 1/399\n",
+      "2023-04-06 22:51:31,254 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 22:51:31,255 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:51:31,259 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5026, UAS: 0.5009, LAS: 0.2748, UEM: 0.3237, LEM: 0.0478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9612, partial_loss/deprel_loss: 2.2067, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0384, loss: 4.7510, batch_reg_loss: 0.0809, reg_loss: 0.0810 ||:   3%|2         | 3/111 [00:02<01:25,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2153, UAS: 0.4222, LAS: 0.2111, UEM: 0.2335, LEM: 0.0345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8553, partial_loss/deprel_loss: 5.3630, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1419, loss: 5.9501, batch_reg_loss: 0.0804, reg_loss: 0.0808 ||:   5%|5         | 6/111 [00:04<01:21,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1178, UAS: 0.3878, LAS: 0.1808, UEM: 0.1884, LEM: 0.0278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.1742, partial_loss/deprel_loss: 7.5720, partial_loss/cycle_loss: 0.0000, batch_loss: 7.5724, loss: 6.4967, batch_reg_loss: 0.0800, reg_loss: 0.0806 ||:   8%|8         | 9/111 [00:06<01:17,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1538, UAS: 0.3796, LAS: 0.1788, UEM: 0.1554, LEM: 0.0230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.8665, partial_loss/deprel_loss: 7.3143, partial_loss/cycle_loss: 0.0000, batch_loss: 7.3044, loss: 6.6142, batch_reg_loss: 0.0796, reg_loss: 0.0804 ||:  11%|#         | 12/111 [00:08<01:14,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3034, UAS: 0.3993, LAS: 0.1915, UEM: 0.1191, LEM: 0.0176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8777, partial_loss/deprel_loss: 4.3489, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1338, loss: 6.2776, batch_reg_loss: 0.0791, reg_loss: 0.0801 ||:  14%|#3        | 15/111 [00:11<01:10,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0891, UAS: 0.4053, LAS: 0.1952, UEM: 0.0993, LEM: 0.0147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 11.4397, partial_loss/deprel_loss: 9.1175, partial_loss/cycle_loss: 0.0000, batch_loss: 9.6606, loss: 6.2553, batch_reg_loss: 0.0787, reg_loss: 0.0799 ||:  16%|#6        | 18/111 [00:13<01:07,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1735, UAS: 0.3983, LAS: 0.1911, UEM: 0.0899, LEM: 0.0133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8049, partial_loss/deprel_loss: 6.6946, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5950, loss: 6.3528, batch_reg_loss: 0.0783, reg_loss: 0.0797 ||:  19%|#8        | 21/111 [00:15<01:03,  1.41it/s] \n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2083, UAS: 0.3981, LAS: 0.1902, UEM: 0.0799, LEM: 0.0118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.1757, partial_loss/deprel_loss: 6.1916, partial_loss/cycle_loss: 0.0000, batch_loss: 6.0662, loss: 6.4057, batch_reg_loss: 0.0778, reg_loss: 0.0794 ||:  23%|##2       | 25/111 [00:17<00:58,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2246, UAS: 0.4012, LAS: 0.1929, UEM: 0.0725, LEM: 0.0107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8645, partial_loss/deprel_loss: 6.6577, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5763, loss: 6.4495, batch_reg_loss: 0.0772, reg_loss: 0.0792 ||:  26%|##6       | 29/111 [00:19<00:53,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2794, UAS: 0.4082, LAS: 0.1982, UEM: 0.0672, LEM: 0.0099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.1211, partial_loss/deprel_loss: 5.4412, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2540, loss: 6.4181, batch_reg_loss: 0.0768, reg_loss: 0.0790 ||:  29%|##8       | 32/111 [00:22<00:52,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4732, UAS: 0.4244, LAS: 0.2122, UEM: 0.0709, LEM: 0.0090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3779, partial_loss/deprel_loss: 2.8672, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6458, loss: 6.2343, batch_reg_loss: 0.0764, reg_loss: 0.0787 ||:  32%|###1      | 35/111 [00:24<00:51,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3141, UAS: 0.4378, LAS: 0.2248, UEM: 0.0649, LEM: 0.0081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.3674, partial_loss/deprel_loss: 5.2037, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1125, loss: 6.0777, batch_reg_loss: 0.0761, reg_loss: 0.0785 ||:  34%|###4      | 38/111 [00:26<00:49,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2198, UAS: 0.4458, LAS: 0.2334, UEM: 0.0596, LEM: 0.0074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.4857, partial_loss/deprel_loss: 7.1532, partial_loss/cycle_loss: 0.0000, batch_loss: 7.2953, loss: 6.0151, batch_reg_loss: 0.0756, reg_loss: 0.0783 ||:  38%|###7      | 42/111 [00:28<00:44,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1855, UAS: 0.4456, LAS: 0.2364, UEM: 0.0564, LEM: 0.0070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.3300, partial_loss/deprel_loss: 7.6093, partial_loss/cycle_loss: 0.0000, batch_loss: 8.0285, loss: 6.0670, batch_reg_loss: 0.0751, reg_loss: 0.0780 ||:  41%|####1     | 46/111 [00:31<00:41,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3267, UAS: 0.4538, LAS: 0.2458, UEM: 0.0542, LEM: 0.0064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.7855, partial_loss/deprel_loss: 5.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3551, loss: 5.9627, batch_reg_loss: 0.0747, reg_loss: 0.0778 ||:  45%|####5     | 50/111 [00:33<00:40,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2382, UAS: 0.4571, LAS: 0.2516, UEM: 0.0580, LEM: 0.0061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.0241, partial_loss/deprel_loss: 6.9911, partial_loss/cycle_loss: 0.0000, batch_loss: 7.2719, loss: 5.9374, batch_reg_loss: 0.0743, reg_loss: 0.0775 ||:  49%|####8     | 54/111 [00:36<00:38,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3417, UAS: 0.4640, LAS: 0.2595, UEM: 0.0551, LEM: 0.0057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.8885, partial_loss/deprel_loss: 5.4813, partial_loss/cycle_loss: 0.0000, batch_loss: 5.4367, loss: 5.8601, batch_reg_loss: 0.0740, reg_loss: 0.0773 ||:  51%|#####1    | 57/111 [00:38<00:37,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5159, UAS: 0.4709, LAS: 0.2672, UEM: 0.0535, LEM: 0.0055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9516, partial_loss/deprel_loss: 3.0269, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8855, loss: 5.7894, batch_reg_loss: 0.0737, reg_loss: 0.0772 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3337, UAS: 0.4761, LAS: 0.2741, UEM: 0.0511, LEM: 0.0052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.5468, partial_loss/deprel_loss: 5.5245, partial_loss/cycle_loss: 0.0000, batch_loss: 5.6022, loss: 5.7441, batch_reg_loss: 0.0733, reg_loss: 0.0769 ||:  58%|#####7    | 64/111 [00:43<00:32,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4904, UAS: 0.4849, LAS: 0.2834, UEM: 0.0531, LEM: 0.0049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4105, partial_loss/deprel_loss: 3.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 3.2892, loss: 5.6526, batch_reg_loss: 0.0730, reg_loss: 0.0768 ||:  60%|######    | 67/111 [00:45<00:29,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4030, UAS: 0.4920, LAS: 0.2912, UEM: 0.0521, LEM: 0.0047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4853, partial_loss/deprel_loss: 4.8174, partial_loss/cycle_loss: 0.0000, batch_loss: 4.8237, loss: 5.5778, batch_reg_loss: 0.0727, reg_loss: 0.0766 ||:  63%|######3   | 70/111 [00:47<00:28,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5730, UAS: 0.4957, LAS: 0.2965, UEM: 0.0518, LEM: 0.0046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8525, partial_loss/deprel_loss: 2.9431, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7975, loss: 5.5408, batch_reg_loss: 0.0724, reg_loss: 0.0764 ||:  66%|######5   | 73/111 [00:50<00:26,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6026, UAS: 0.5030, LAS: 0.3044, UEM: 0.0582, LEM: 0.0055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2230, partial_loss/deprel_loss: 2.2791, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1400, loss: 5.4648, batch_reg_loss: 0.0722, reg_loss: 0.0763 ||:  68%|######8   | 76/111 [00:52<00:24,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5257, UAS: 0.5093, LAS: 0.3114, UEM: 0.0590, LEM: 0.0055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3376, partial_loss/deprel_loss: 3.2408, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1320, loss: 5.3956, batch_reg_loss: 0.0719, reg_loss: 0.0761 ||:  71%|#######1  | 79/111 [00:54<00:22,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4749, UAS: 0.5194, LAS: 0.3224, UEM: 0.0594, LEM: 0.0054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.3244, partial_loss/deprel_loss: 4.0444, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9720, loss: 5.2892, batch_reg_loss: 0.0716, reg_loss: 0.0759 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3801, UAS: 0.5250, LAS: 0.3287, UEM: 0.0793, LEM: 0.0098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.3332, partial_loss/deprel_loss: 5.2213, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3150, loss: 5.2322, batch_reg_loss: 0.0713, reg_loss: 0.0757 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6195, UAS: 0.5311, LAS: 0.3359, UEM: 0.0901, LEM: 0.0120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5655, partial_loss/deprel_loss: 2.5718, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4416, loss: 5.1692, batch_reg_loss: 0.0711, reg_loss: 0.0756 ||:  80%|########  | 89/111 [01:01<00:15,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3892, UAS: 0.5363, LAS: 0.3422, UEM: 0.0929, LEM: 0.0126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.3758, partial_loss/deprel_loss: 4.9502, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1062, loss: 5.1101, batch_reg_loss: 0.0708, reg_loss: 0.0754 ||:  83%|########2 | 92/111 [01:03<00:14,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4308, UAS: 0.5397, LAS: 0.3464, UEM: 0.0947, LEM: 0.0126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4937, partial_loss/deprel_loss: 4.5762, partial_loss/cycle_loss: 0.0000, batch_loss: 4.6303, loss: 5.0772, batch_reg_loss: 0.0706, reg_loss: 0.0753 ||:  86%|########5 | 95/111 [01:05<00:12,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4948, UAS: 0.5455, LAS: 0.3534, UEM: 0.0926, LEM: 0.0121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4684, partial_loss/deprel_loss: 3.7837, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7909, loss: 5.0118, batch_reg_loss: 0.0703, reg_loss: 0.0751 ||:  89%|########9 | 99/111 [01:08<00:08,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5697, UAS: 0.5519, LAS: 0.3608, UEM: 0.0901, LEM: 0.0116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5438, partial_loss/deprel_loss: 3.1081, partial_loss/cycle_loss: 0.0000, batch_loss: 3.0652, loss: 4.9450, batch_reg_loss: 0.0700, reg_loss: 0.0749 ||:  93%|#########2| 103/111 [01:11<00:05,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4417, UAS: 0.5557, LAS: 0.3658, UEM: 0.0879, LEM: 0.0113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.9554, partial_loss/deprel_loss: 4.7208, partial_loss/cycle_loss: 0.0000, batch_loss: 4.8375, loss: 4.9064, batch_reg_loss: 0.0697, reg_loss: 0.0747 ||:  96%|#########6| 107/111 [01:13<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4557, UAS: 0.5579, LAS: 0.3695, UEM: 0.0862, LEM: 0.0111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5091, partial_loss/deprel_loss: 4.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 4.5886, loss: 4.8903, batch_reg_loss: 0.0695, reg_loss: 0.0745 ||: 100%|##########| 111/111 [01:16<00:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4557, UAS: 0.5579, LAS: 0.3695, UEM: 0.0862, LEM: 0.0111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5091, partial_loss/deprel_loss: 4.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 4.5886, loss: 4.8903, batch_reg_loss: 0.0695, reg_loss: 0.0745 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
+      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     4.522  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     4.509  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.075  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - UEM                      |     0.086  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - LAS                      |     0.369  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - loss                     |     4.890  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - LEM                      |     0.011  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - UAS                      |     0.558  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - EM                       |     0.456  |       N/A\n",
+      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 22:52:47,524 - INFO - combo.training.trainer - Epoch duration: 0:01:16.269599\n",
+      "2023-04-06 22:52:47,524 - INFO - combo.training.trainer - Estimated training time remaining: 9:57:43\n",
+      "2023-04-06 22:52:47,524 - INFO - allennlp.training.trainer - Epoch 2/399\n",
+      "2023-04-06 22:52:47,524 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 22:52:47,525 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:52:47,531 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4964, UAS: 0.6204, LAS: 0.4727, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5829, partial_loss/deprel_loss: 3.9397, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9376, loss: 4.4478, batch_reg_loss: 0.0693, reg_loss: 0.0693 ||:   3%|2         | 3/111 [00:02<01:15,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6479, UAS: 0.6977, LAS: 0.5419, UEM: 0.1026, LEM: 0.0106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4297, partial_loss/deprel_loss: 2.4040, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2782, loss: 3.5690, batch_reg_loss: 0.0691, reg_loss: 0.0692 ||:   5%|5         | 6/111 [00:04<01:13,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4715, UAS: 0.6718, LAS: 0.5218, UEM: 0.0755, LEM: 0.0079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.3314, partial_loss/deprel_loss: 4.2643, partial_loss/cycle_loss: 0.0000, batch_loss: 4.3466, loss: 3.8142, batch_reg_loss: 0.0688, reg_loss: 0.0691 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6659, UAS: 0.6858, LAS: 0.5350, UEM: 0.0982, LEM: 0.0139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2351, partial_loss/deprel_loss: 2.0560, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9605, loss: 3.6185, batch_reg_loss: 0.0687, reg_loss: 0.0690 ||:  12%|#1        | 13/111 [00:09<01:10,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4735, UAS: 0.6843, LAS: 0.5326, UEM: 0.0795, LEM: 0.0112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.1403, partial_loss/deprel_loss: 4.2142, partial_loss/cycle_loss: 0.0000, batch_loss: 4.2679, loss: 3.6370, batch_reg_loss: 0.0685, reg_loss: 0.0689 ||:  15%|#5        | 17/111 [00:11<01:04,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6194, UAS: 0.6898, LAS: 0.5366, UEM: 0.0818, LEM: 0.0096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6949, partial_loss/deprel_loss: 2.5650, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4592, loss: 3.5757, batch_reg_loss: 0.0683, reg_loss: 0.0688 ||:  19%|#8        | 21/111 [00:14<01:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8213, UAS: 0.6979, LAS: 0.5455, UEM: 0.2170, LEM: 0.0958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2964, partial_loss/deprel_loss: 0.8507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8079, loss: 3.5040, batch_reg_loss: 0.0681, reg_loss: 0.0687 ||:  23%|##2       | 25/111 [00:17<01:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5476, UAS: 0.7039, LAS: 0.5509, UEM: 0.1942, LEM: 0.0844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0957, partial_loss/deprel_loss: 3.5291, partial_loss/cycle_loss: 0.0000, batch_loss: 3.5103, loss: 3.4550, batch_reg_loss: 0.0679, reg_loss: 0.0686 ||:  26%|##6       | 29/111 [00:19<00:55,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4213, UAS: 0.7068, LAS: 0.5547, UEM: 0.2095, LEM: 0.0826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.1965, partial_loss/deprel_loss: 4.9298, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2509, loss: 3.4173, batch_reg_loss: 0.0677, reg_loss: 0.0685 ||:  29%|##8       | 32/111 [00:21<00:54,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4924, UAS: 0.7115, LAS: 0.5588, UEM: 0.1968, LEM: 0.0746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.2653, partial_loss/deprel_loss: 4.2745, partial_loss/cycle_loss: 0.0000, batch_loss: 4.3402, loss: 3.3855, batch_reg_loss: 0.0675, reg_loss: 0.0684 ||:  32%|###2      | 36/111 [00:24<00:49,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4861, UAS: 0.7136, LAS: 0.5609, UEM: 0.1834, LEM: 0.0689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.9229, partial_loss/deprel_loss: 4.5551, partial_loss/cycle_loss: 0.0000, batch_loss: 4.6960, loss: 3.3816, batch_reg_loss: 0.0673, reg_loss: 0.0683 ||:  36%|###6      | 40/111 [00:26<00:45,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5632, UAS: 0.7197, LAS: 0.5670, UEM: 0.2184, LEM: 0.0784, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7730, partial_loss/deprel_loss: 3.3519, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3032, loss: 3.3144, batch_reg_loss: 0.0672, reg_loss: 0.0682 ||:  40%|###9      | 44/111 [00:29<00:43,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6700, UAS: 0.7271, LAS: 0.5743, UEM: 0.2131, LEM: 0.0736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5173, partial_loss/deprel_loss: 2.2309, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1552, loss: 3.2352, batch_reg_loss: 0.0670, reg_loss: 0.0681 ||:  43%|####3     | 48/111 [00:32<00:42,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6822, UAS: 0.7298, LAS: 0.5776, UEM: 0.2081, LEM: 0.0692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4613, partial_loss/deprel_loss: 2.0556, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0036, loss: 3.1978, batch_reg_loss: 0.0668, reg_loss: 0.0680 ||:  47%|####6     | 52/111 [00:34<00:38,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5462, UAS: 0.7286, LAS: 0.5768, UEM: 0.2001, LEM: 0.0662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8922, partial_loss/deprel_loss: 3.8440, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9202, loss: 3.2158, batch_reg_loss: 0.0666, reg_loss: 0.0679 ||:  50%|#####     | 56/111 [00:37<00:34,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6350, UAS: 0.7299, LAS: 0.5784, UEM: 0.1921, LEM: 0.0628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9702, partial_loss/deprel_loss: 2.6377, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5707, loss: 3.2028, batch_reg_loss: 0.0665, reg_loss: 0.0678 ||:  54%|#####4    | 60/111 [00:39<00:31,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5091, UAS: 0.7325, LAS: 0.5817, UEM: 0.2037, LEM: 0.0652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4303, partial_loss/deprel_loss: 4.1332, partial_loss/cycle_loss: 0.0000, batch_loss: 4.2589, loss: 3.1722, batch_reg_loss: 0.0663, reg_loss: 0.0677 ||:  58%|#####7    | 64/111 [00:42<00:29,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7077, UAS: 0.7373, LAS: 0.5864, UEM: 0.2098, LEM: 0.0632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8847, partial_loss/deprel_loss: 1.6877, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5933, loss: 3.1156, batch_reg_loss: 0.0661, reg_loss: 0.0677 ||:  61%|######1   | 68/111 [00:45<00:28,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6647, UAS: 0.7394, LAS: 0.5886, UEM: 0.2110, LEM: 0.0610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6878, partial_loss/deprel_loss: 2.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2747, loss: 3.0945, batch_reg_loss: 0.0660, reg_loss: 0.0676 ||:  65%|######4   | 72/111 [00:47<00:26,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7484, UAS: 0.7455, LAS: 0.5957, UEM: 0.2179, LEM: 0.0604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9192, partial_loss/deprel_loss: 1.6239, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5488, loss: 3.0243, batch_reg_loss: 0.0658, reg_loss: 0.0675 ||:  68%|######8   | 76/111 [00:50<00:22,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6129, UAS: 0.7469, LAS: 0.5972, UEM: 0.2108, LEM: 0.0580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4237, partial_loss/deprel_loss: 2.8786, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8533, loss: 3.0067, batch_reg_loss: 0.0657, reg_loss: 0.0674 ||:  72%|#######2  | 80/111 [00:52<00:20,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6110, UAS: 0.7481, LAS: 0.5991, UEM: 0.2070, LEM: 0.0563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7020, partial_loss/deprel_loss: 2.9102, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9341, loss: 2.9940, batch_reg_loss: 0.0655, reg_loss: 0.0673 ||:  76%|#######5  | 84/111 [00:55<00:17,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6596, UAS: 0.7500, LAS: 0.6014, UEM: 0.2146, LEM: 0.0583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7501, partial_loss/deprel_loss: 2.3329, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2817, loss: 2.9726, batch_reg_loss: 0.0654, reg_loss: 0.0672 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6643, UAS: 0.7513, LAS: 0.6027, UEM: 0.2091, LEM: 0.0562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8068, partial_loss/deprel_loss: 2.3690, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3218, loss: 2.9569, batch_reg_loss: 0.0652, reg_loss: 0.0671 ||:  83%|########2 | 92/111 [01:00<00:12,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6382, UAS: 0.7496, LAS: 0.6019, UEM: 0.2044, LEM: 0.0549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3354, partial_loss/deprel_loss: 2.7962, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7691, loss: 2.9764, batch_reg_loss: 0.0651, reg_loss: 0.0670 ||:  86%|########6 | 96/111 [01:03<00:09,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6473, UAS: 0.7524, LAS: 0.6053, UEM: 0.2124, LEM: 0.0594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9798, partial_loss/deprel_loss: 2.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4257, loss: 2.9392, batch_reg_loss: 0.0650, reg_loss: 0.0670 ||:  90%|######### | 100/111 [01:06<00:07,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7644, UAS: 0.7557, LAS: 0.6091, UEM: 0.2193, LEM: 0.0602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7733, partial_loss/deprel_loss: 1.3687, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3145, loss: 2.9018, batch_reg_loss: 0.0649, reg_loss: 0.0669 ||:  93%|#########2| 103/111 [01:08<00:05,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7474, UAS: 0.7586, LAS: 0.6125, UEM: 0.2241, LEM: 0.0607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8481, partial_loss/deprel_loss: 1.5531, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4769, loss: 2.8675, batch_reg_loss: 0.0648, reg_loss: 0.0668 ||:  95%|#########5| 106/111 [01:10<00:03,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6552, UAS: 0.7581, LAS: 0.6123, UEM: 0.2194, LEM: 0.0593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0818, partial_loss/deprel_loss: 2.4685, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4559, loss: 2.8710, batch_reg_loss: 0.0647, reg_loss: 0.0668 ||:  99%|#########9| 110/111 [01:13<00:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7474, UAS: 0.7592, LAS: 0.6135, UEM: 0.2213, LEM: 0.0596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8614, partial_loss/deprel_loss: 1.4801, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4210, loss: 2.8579, batch_reg_loss: 0.0646, reg_loss: 0.0668 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
+      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.480  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.861  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.067  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - UEM                      |     0.221  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - LAS                      |     0.614  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - loss                     |     2.858  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - LEM                      |     0.060  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - UAS                      |     0.759  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - EM                       |     0.747  |       N/A\n",
+      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 22:54:01,489 - INFO - combo.training.trainer - Epoch duration: 0:01:13.964691\n",
+      "2023-04-06 22:54:01,489 - INFO - combo.training.trainer - Estimated training time remaining: 9:20:36\n",
+      "2023-04-06 22:54:01,489 - INFO - allennlp.training.trainer - Epoch 3/399\n",
+      "2023-04-06 22:54:01,489 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 22:54:01,490 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:54:01,496 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5522, UAS: 0.7779, LAS: 0.6461, UEM: 0.4911, LEM: 0.1886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8721, partial_loss/deprel_loss: 3.5902, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7111, loss: 2.6501, batch_reg_loss: 0.0646, reg_loss: 0.0646 ||:   3%|2         | 3/111 [00:02<01:18,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5244, UAS: 0.7464, LAS: 0.6105, UEM: 0.3157, LEM: 0.1195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4001, partial_loss/deprel_loss: 3.7685, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9592, loss: 2.9957, batch_reg_loss: 0.0644, reg_loss: 0.0645 ||:   6%|6         | 7/111 [00:04<01:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7839, UAS: 0.7827, LAS: 0.6504, UEM: 0.3397, LEM: 0.1092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6771, partial_loss/deprel_loss: 1.2152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1719, loss: 2.5749, batch_reg_loss: 0.0644, reg_loss: 0.0645 ||:   9%|9         | 10/111 [00:07<01:15,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5962, UAS: 0.7864, LAS: 0.6557, UEM: 0.2923, LEM: 0.0888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4499, partial_loss/deprel_loss: 3.2404, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3466, loss: 2.5323, batch_reg_loss: 0.0643, reg_loss: 0.0644 ||:  12%|#1        | 13/111 [00:09<01:15,  1.30it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7262, UAS: 0.7947, LAS: 0.6646, UEM: 0.2585, LEM: 0.0737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3265, partial_loss/deprel_loss: 2.0057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9340, loss: 2.4410, batch_reg_loss: 0.0642, reg_loss: 0.0644 ||:  14%|#4        | 16/111 [00:11<01:10,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7504, UAS: 0.7977, LAS: 0.6674, UEM: 0.2444, LEM: 0.0644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9908, partial_loss/deprel_loss: 1.5113, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4713, loss: 2.4127, batch_reg_loss: 0.0641, reg_loss: 0.0644 ||:  18%|#8        | 20/111 [00:14<01:04,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7616, UAS: 0.8064, LAS: 0.6763, UEM: 0.2720, LEM: 0.0723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6766, partial_loss/deprel_loss: 1.3444, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2749, loss: 2.3152, batch_reg_loss: 0.0640, reg_loss: 0.0643 ||:  22%|##1       | 24/111 [00:17<01:01,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7372, UAS: 0.8092, LAS: 0.6787, UEM: 0.2590, LEM: 0.0651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9644, partial_loss/deprel_loss: 1.6293, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5602, loss: 2.2885, batch_reg_loss: 0.0639, reg_loss: 0.0643 ||:  25%|##5       | 28/111 [00:19<00:56,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6937, UAS: 0.8106, LAS: 0.6800, UEM: 0.2438, LEM: 0.0602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7709, partial_loss/deprel_loss: 2.3077, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2642, loss: 2.2836, batch_reg_loss: 0.0638, reg_loss: 0.0642 ||:  28%|##7       | 31/111 [00:21<00:54,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6296, UAS: 0.8098, LAS: 0.6796, UEM: 0.2471, LEM: 0.0589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8165, partial_loss/deprel_loss: 2.8907, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9396, loss: 2.2935, batch_reg_loss: 0.0637, reg_loss: 0.0642 ||:  31%|###       | 34/111 [00:23<00:52,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7206, UAS: 0.8103, LAS: 0.6805, UEM: 0.2360, LEM: 0.0556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4751, partial_loss/deprel_loss: 1.8719, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8562, loss: 2.2865, batch_reg_loss: 0.0637, reg_loss: 0.0641 ||:  33%|###3      | 37/111 [00:25<00:50,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7730, UAS: 0.8120, LAS: 0.6830, UEM: 0.2357, LEM: 0.0549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7538, partial_loss/deprel_loss: 1.3218, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2718, loss: 2.2638, batch_reg_loss: 0.0636, reg_loss: 0.0641 ||:  37%|###6      | 41/111 [00:28<00:48,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7604, UAS: 0.8162, LAS: 0.6880, UEM: 0.2428, LEM: 0.0550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9503, partial_loss/deprel_loss: 1.5284, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4763, loss: 2.2114, batch_reg_loss: 0.0635, reg_loss: 0.0640 ||:  40%|###9      | 44/111 [00:31<00:48,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6857, UAS: 0.8111, LAS: 0.6833, UEM: 0.2349, LEM: 0.0532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9399, partial_loss/deprel_loss: 2.2534, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2541, loss: 2.2633, batch_reg_loss: 0.0634, reg_loss: 0.0640 ||:  42%|####2     | 47/111 [00:33<00:45,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5934, UAS: 0.8120, LAS: 0.6844, UEM: 0.2419, LEM: 0.0557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2585, partial_loss/deprel_loss: 3.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 3.4829, loss: 2.2516, batch_reg_loss: 0.0634, reg_loss: 0.0640 ||:  45%|####5     | 50/111 [00:35<00:43,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7835, UAS: 0.8132, LAS: 0.6859, UEM: 0.2388, LEM: 0.0539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8033, partial_loss/deprel_loss: 1.3395, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2956, loss: 2.2403, batch_reg_loss: 0.0633, reg_loss: 0.0639 ||:  49%|####8     | 54/111 [00:37<00:39,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6621, UAS: 0.8141, LAS: 0.6874, UEM: 0.2512, LEM: 0.0626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2108, partial_loss/deprel_loss: 2.3082, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3519, loss: 2.2189, batch_reg_loss: 0.0632, reg_loss: 0.0639 ||:  51%|#####1    | 57/111 [00:40<00:38,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7630, UAS: 0.8126, LAS: 0.6865, UEM: 0.2518, LEM: 0.0619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7939, partial_loss/deprel_loss: 1.3554, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3063, loss: 2.2319, batch_reg_loss: 0.0631, reg_loss: 0.0638 ||:  55%|#####4    | 61/111 [00:42<00:34,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6531, UAS: 0.8133, LAS: 0.6870, UEM: 0.2467, LEM: 0.0600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5764, partial_loss/deprel_loss: 2.7017, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7397, loss: 2.2260, batch_reg_loss: 0.0631, reg_loss: 0.0638 ||:  58%|#####7    | 64/111 [00:44<00:32,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7632, UAS: 0.8168, LAS: 0.6906, UEM: 0.2563, LEM: 0.0609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0152, partial_loss/deprel_loss: 1.4983, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4647, loss: 2.1896, batch_reg_loss: 0.0630, reg_loss: 0.0638 ||:  60%|######    | 67/111 [00:46<00:31,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7593, UAS: 0.8180, LAS: 0.6922, UEM: 0.2522, LEM: 0.0592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0271, partial_loss/deprel_loss: 1.5328, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4947, loss: 2.1787, batch_reg_loss: 0.0630, reg_loss: 0.0637 ||:  63%|######3   | 70/111 [00:49<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.8196, LAS: 0.6948, UEM: 0.2829, LEM: 0.0893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2393, partial_loss/deprel_loss: 0.5426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5448, loss: 2.1589, batch_reg_loss: 0.0629, reg_loss: 0.0637 ||:  67%|######6   | 74/111 [00:52<00:27,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6841, UAS: 0.8216, LAS: 0.6972, UEM: 0.2908, LEM: 0.0913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9630, partial_loss/deprel_loss: 2.3586, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3423, loss: 2.1351, batch_reg_loss: 0.0628, reg_loss: 0.0637 ||:  69%|######9   | 77/111 [00:54<00:25,  1.32it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7229, UAS: 0.8176, LAS: 0.6935, UEM: 0.2843, LEM: 0.0890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5630, partial_loss/deprel_loss: 1.9479, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9337, loss: 2.1812, batch_reg_loss: 0.0628, reg_loss: 0.0636 ||:  73%|#######2  | 81/111 [00:57<00:21,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7388, UAS: 0.8182, LAS: 0.6943, UEM: 0.2795, LEM: 0.0866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1689, partial_loss/deprel_loss: 1.7263, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6775, loss: 2.1734, batch_reg_loss: 0.0627, reg_loss: 0.0636 ||:  77%|#######6  | 85/111 [00:59<00:17,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7027, UAS: 0.8202, LAS: 0.6969, UEM: 0.2926, LEM: 0.0965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7537, partial_loss/deprel_loss: 2.1230, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1117, loss: 2.1483, batch_reg_loss: 0.0626, reg_loss: 0.0635 ||:  80%|########  | 89/111 [01:02<00:14,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7744, UAS: 0.8185, LAS: 0.6957, UEM: 0.2882, LEM: 0.0944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0477, partial_loss/deprel_loss: 1.4812, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4571, loss: 2.1638, batch_reg_loss: 0.0626, reg_loss: 0.0635 ||:  84%|########3 | 93/111 [01:04<00:11,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8176, UAS: 0.8203, LAS: 0.6977, UEM: 0.2968, LEM: 0.0975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4458, partial_loss/deprel_loss: 0.9504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9120, loss: 2.1448, batch_reg_loss: 0.0625, reg_loss: 0.0635 ||:  87%|########7 | 97/111 [01:07<00:09,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6879, UAS: 0.8175, LAS: 0.6950, UEM: 0.2918, LEM: 0.0958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0558, partial_loss/deprel_loss: 2.3149, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3255, loss: 2.1791, batch_reg_loss: 0.0624, reg_loss: 0.0634 ||:  91%|######### | 101/111 [01:10<00:06,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7525, UAS: 0.8183, LAS: 0.6962, UEM: 0.2889, LEM: 0.0938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1692, partial_loss/deprel_loss: 1.6748, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6361, loss: 2.1703, batch_reg_loss: 0.0624, reg_loss: 0.0634 ||:  95%|#########4| 105/111 [01:13<00:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6415, UAS: 0.8200, LAS: 0.6981, UEM: 0.2967, LEM: 0.0958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.9598, partial_loss/deprel_loss: 2.7343, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8417, loss: 2.1535, batch_reg_loss: 0.0623, reg_loss: 0.0633 ||:  98%|#########8| 109/111 [01:15<00:01,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6768, UAS: 0.8197, LAS: 0.6979, UEM: 0.2936, LEM: 0.0948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2748, partial_loss/deprel_loss: 2.3791, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4206, loss: 2.1574, batch_reg_loss: 0.0623, reg_loss: 0.0633 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-06 22:55:18,227 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:55:18,227 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     2.379  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     2.275  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.063  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - UEM                      |     0.294  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - LAS                      |     0.698  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - loss                     |     2.157  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - LEM                      |     0.095  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - UAS                      |     0.820  |       N/A\n",
+      "2023-04-06 22:55:18,229 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:55:18,229 - INFO - combo.training.tensorboard_writer - EM                       |     0.677  |       N/A\n",
+      "2023-04-06 22:55:18,229 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 22:55:18,229 - INFO - combo.training.trainer - Epoch duration: 0:01:16.740242\n",
+      "2023-04-06 22:55:18,229 - INFO - combo.training.trainer - Estimated training time remaining: 9:06:01\n",
+      "2023-04-06 22:55:18,230 - INFO - allennlp.training.trainer - Epoch 4/399\n",
+      "2023-04-06 22:55:18,230 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 22:55:18,230 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:55:18,236 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6673, UAS: 0.7876, LAS: 0.6728, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6651, partial_loss/deprel_loss: 2.6082, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6819, loss: 2.5358, batch_reg_loss: 0.0623, reg_loss: 0.0623 ||:   3%|2         | 3/111 [00:02<01:16,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5590, UAS: 0.7847, LAS: 0.6734, UEM: 0.0866, LEM: 0.0162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.1240, partial_loss/deprel_loss: 3.5891, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9583, loss: 2.5349, batch_reg_loss: 0.0623, reg_loss: 0.0623 ||:   5%|5         | 6/111 [00:04<01:14,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8070, UAS: 0.8104, LAS: 0.7009, UEM: 0.1961, LEM: 0.0497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6716, partial_loss/deprel_loss: 1.1607, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1251, loss: 2.2299, batch_reg_loss: 0.0622, reg_loss: 0.0623 ||:   8%|8         | 9/111 [00:06<01:13,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6524, UAS: 0.8224, LAS: 0.7121, UEM: 0.2315, LEM: 0.0565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7101, partial_loss/deprel_loss: 2.5980, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6826, loss: 2.1006, batch_reg_loss: 0.0622, reg_loss: 0.0622 ||:  12%|#1        | 13/111 [00:09<01:08,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8191, UAS: 0.8348, LAS: 0.7248, UEM: 0.3040, LEM: 0.0847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6051, partial_loss/deprel_loss: 1.1280, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0855, loss: 1.9659, batch_reg_loss: 0.0621, reg_loss: 0.0622 ||:  14%|#4        | 16/111 [00:11<01:08,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7504, UAS: 0.8448, LAS: 0.7351, UEM: 0.3447, LEM: 0.0959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1769, partial_loss/deprel_loss: 1.5892, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5688, loss: 1.8513, batch_reg_loss: 0.0621, reg_loss: 0.0622 ||:  17%|#7        | 19/111 [00:13<01:08,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6802, UAS: 0.8436, LAS: 0.7338, UEM: 0.3206, LEM: 0.0886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3447, partial_loss/deprel_loss: 2.3007, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3715, loss: 1.8468, batch_reg_loss: 0.0620, reg_loss: 0.0622 ||:  21%|##        | 23/111 [00:16<01:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6018, UAS: 0.8382, LAS: 0.7278, UEM: 0.2957, LEM: 0.0798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.6370, partial_loss/deprel_loss: 2.9539, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1524, loss: 1.9081, batch_reg_loss: 0.0620, reg_loss: 0.0621 ||:  24%|##4       | 27/111 [00:18<00:56,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8199, UAS: 0.8419, LAS: 0.7321, UEM: 0.3047, LEM: 0.0860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6244, partial_loss/deprel_loss: 1.0798, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0506, loss: 1.8696, batch_reg_loss: 0.0619, reg_loss: 0.0621 ||:  28%|##7       | 31/111 [00:21<00:53,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6994, UAS: 0.8443, LAS: 0.7347, UEM: 0.3040, LEM: 0.0849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3267, partial_loss/deprel_loss: 2.3726, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4253, loss: 1.8526, batch_reg_loss: 0.0619, reg_loss: 0.0621 ||:  31%|###       | 34/111 [00:23<00:52,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8111, UAS: 0.8474, LAS: 0.7388, UEM: 0.3153, LEM: 0.0885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5854, partial_loss/deprel_loss: 1.0084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9856, loss: 1.8095, batch_reg_loss: 0.0618, reg_loss: 0.0621 ||:  33%|###3      | 37/111 [00:26<00:54,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7707, UAS: 0.8458, LAS: 0.7371, UEM: 0.3159, LEM: 0.0895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1063, partial_loss/deprel_loss: 1.5260, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5038, loss: 1.8230, batch_reg_loss: 0.0618, reg_loss: 0.0620 ||:  37%|###6      | 41/111 [00:28<00:49,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6812, UAS: 0.8369, LAS: 0.7281, UEM: 0.3046, LEM: 0.0863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4355, partial_loss/deprel_loss: 2.4780, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5312, loss: 1.9258, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||:  41%|####      | 45/111 [00:31<00:44,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7159, UAS: 0.8362, LAS: 0.7273, UEM: 0.2977, LEM: 0.0830, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6377, partial_loss/deprel_loss: 2.1209, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0860, loss: 1.9371, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||:  43%|####3     | 48/111 [00:33<00:44,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7413, UAS: 0.8332, LAS: 0.7243, UEM: 0.2893, LEM: 0.0804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3635, partial_loss/deprel_loss: 1.7896, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7661, loss: 1.9680, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||:  46%|####5     | 51/111 [00:35<00:43,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7546, UAS: 0.8368, LAS: 0.7289, UEM: 0.3044, LEM: 0.0903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4638, partial_loss/deprel_loss: 1.6606, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6829, loss: 1.9241, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||:  50%|####9     | 55/111 [00:38<00:38,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8019, UAS: 0.8378, LAS: 0.7302, UEM: 0.2995, LEM: 0.0866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7480, partial_loss/deprel_loss: 1.2659, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2240, loss: 1.9138, batch_reg_loss: 0.0617, reg_loss: 0.0619 ||:  53%|#####3    | 59/111 [00:40<00:35,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7229, UAS: 0.8413, LAS: 0.7346, UEM: 0.3580, LEM: 0.1405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7434, partial_loss/deprel_loss: 2.0320, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0359, loss: 1.8734, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||:  56%|#####5    | 62/111 [00:43<00:36,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7846, UAS: 0.8430, LAS: 0.7366, UEM: 0.3472, LEM: 0.1341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0253, partial_loss/deprel_loss: 1.4828, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4530, loss: 1.8528, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||:  59%|#####9    | 66/111 [00:46<00:32,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8108, UAS: 0.8447, LAS: 0.7383, UEM: 0.3415, LEM: 0.1300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7083, partial_loss/deprel_loss: 1.0955, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0797, loss: 1.8399, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||:  63%|######3   | 70/111 [00:49<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8163, UAS: 0.8453, LAS: 0.7392, UEM: 0.3375, LEM: 0.1274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6994, partial_loss/deprel_loss: 1.2058, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1661, loss: 1.8386, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||:  66%|######5   | 73/111 [00:51<00:27,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7005, UAS: 0.8452, LAS: 0.7393, UEM: 0.3279, LEM: 0.1228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2810, partial_loss/deprel_loss: 2.1734, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2565, loss: 1.8368, batch_reg_loss: 0.0615, reg_loss: 0.0619 ||:  69%|######9   | 77/111 [00:53<00:23,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6741, UAS: 0.8452, LAS: 0.7395, UEM: 0.3431, LEM: 0.1362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5383, partial_loss/deprel_loss: 2.6162, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6622, loss: 1.8377, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||:  72%|#######2  | 80/111 [00:55<00:21,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7905, UAS: 0.8448, LAS: 0.7389, UEM: 0.3355, LEM: 0.1324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8467, partial_loss/deprel_loss: 1.3524, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3128, loss: 1.8435, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||:  76%|#######5  | 84/111 [00:58<00:18,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7866, UAS: 0.8450, LAS: 0.7392, UEM: 0.3311, LEM: 0.1296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9914, partial_loss/deprel_loss: 1.4335, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4066, loss: 1.8406, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||:  78%|#######8  | 87/111 [01:00<00:16,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8356, UAS: 0.8472, LAS: 0.7416, UEM: 0.3370, LEM: 0.1305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3395, partial_loss/deprel_loss: 0.8325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7954, loss: 1.8162, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||:  82%|########1 | 91/111 [01:02<00:13,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6469, UAS: 0.8463, LAS: 0.7407, UEM: 0.3336, LEM: 0.1286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0053, partial_loss/deprel_loss: 2.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5838, loss: 1.8231, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||:  85%|########4 | 94/111 [01:05<00:11,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7256, UAS: 0.8454, LAS: 0.7396, UEM: 0.3284, LEM: 0.1263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6650, partial_loss/deprel_loss: 1.9252, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9346, loss: 1.8328, batch_reg_loss: 0.0614, reg_loss: 0.0618 ||:  87%|########7 | 97/111 [01:07<00:10,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7599, UAS: 0.8465, LAS: 0.7407, UEM: 0.3289, LEM: 0.1240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2847, partial_loss/deprel_loss: 1.7309, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7031, loss: 1.8239, batch_reg_loss: 0.0614, reg_loss: 0.0618 ||:  91%|######### | 101/111 [01:09<00:06,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.8483, LAS: 0.7429, UEM: 0.3366, LEM: 0.1267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5180, partial_loss/deprel_loss: 0.8814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8701, loss: 1.8040, batch_reg_loss: 0.0614, reg_loss: 0.0618 ||:  95%|#########4| 105/111 [01:11<00:03,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7331, UAS: 0.8486, LAS: 0.7433, UEM: 0.3357, LEM: 0.1260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9632, partial_loss/deprel_loss: 1.9598, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0219, loss: 1.8012, batch_reg_loss: 0.0614, reg_loss: 0.0617 ||:  98%|#########8| 109/111 [01:14<00:01,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8351, UAS: 0.8500, LAS: 0.7451, UEM: 0.3439, LEM: 0.1293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5623, partial_loss/deprel_loss: 0.9248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9137, loss: 1.7845, batch_reg_loss: 0.0614, reg_loss: 0.0617 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-06 22:56:33,798 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:56:33,798 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.925  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.562  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.062  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - UEM                      |     0.344  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - LAS                      |     0.745  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - loss                     |     1.785  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - LEM                      |     0.129  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - UAS                      |     0.850  |       N/A\n",
+      "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - EM                       |     0.835  |       N/A\n",
+      "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 22:56:33,800 - INFO - combo.training.trainer - Epoch duration: 0:01:15.570663\n",
+      "2023-04-06 22:56:33,800 - INFO - combo.training.trainer - Estimated training time remaining: 8:55:12\n",
+      "2023-04-06 22:56:33,800 - INFO - allennlp.training.trainer - Epoch 5/399\n",
+      "2023-04-06 22:56:33,801 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 22:56:33,801 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:56:33,806 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7017, UAS: 0.8575, LAS: 0.7564, UEM: 0.2434, LEM: 0.0823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1851, partial_loss/deprel_loss: 2.1142, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1898, loss: 1.6516, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:   4%|3         | 4/111 [00:02<00:55,  1.93it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7902, UAS: 0.8573, LAS: 0.7593, UEM: 0.1945, LEM: 0.0493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1142, partial_loss/deprel_loss: 1.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3831, loss: 1.6800, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:   7%|7         | 8/111 [00:04<00:55,  1.84it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8045, UAS: 0.8581, LAS: 0.7600, UEM: 0.1996, LEM: 0.0437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7492, partial_loss/deprel_loss: 1.2165, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1844, loss: 1.6630, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  10%|9         | 11/111 [00:06<01:00,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7124, UAS: 0.8519, LAS: 0.7533, UEM: 0.1704, LEM: 0.0371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3078, partial_loss/deprel_loss: 2.1321, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2286, loss: 1.7343, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  13%|#2        | 14/111 [00:08<01:02,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8202, UAS: 0.8522, LAS: 0.7539, UEM: 0.1756, LEM: 0.0394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7495, partial_loss/deprel_loss: 1.1383, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1219, loss: 1.7377, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  15%|#5        | 17/111 [00:11<01:03,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7448, UAS: 0.8579, LAS: 0.7603, UEM: 0.2127, LEM: 0.0579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5514, partial_loss/deprel_loss: 1.6989, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7308, loss: 1.6711, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  18%|#8        | 20/111 [00:13<01:03,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8081, UAS: 0.8630, LAS: 0.7659, UEM: 0.2570, LEM: 0.0807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9484, partial_loss/deprel_loss: 1.1780, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1934, loss: 1.6165, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  21%|##        | 23/111 [00:15<01:03,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7710, UAS: 0.8636, LAS: 0.7669, UEM: 0.2827, LEM: 0.0951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3315, partial_loss/deprel_loss: 1.5198, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5435, loss: 1.6098, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  23%|##3       | 26/111 [00:17<01:01,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7620, UAS: 0.8608, LAS: 0.7644, UEM: 0.3072, LEM: 0.1148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3709, partial_loss/deprel_loss: 1.5272, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5573, loss: 1.6290, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  27%|##7       | 30/111 [00:20<00:55,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8430, UAS: 0.8687, LAS: 0.7732, UEM: 0.3575, LEM: 0.1333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5238, partial_loss/deprel_loss: 0.8705, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8625, loss: 1.5422, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  31%|###       | 34/111 [00:22<00:51,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6280, UAS: 0.8659, LAS: 0.7697, UEM: 0.3664, LEM: 0.1405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5054, partial_loss/deprel_loss: 2.7331, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9489, loss: 1.5726, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  34%|###4      | 38/111 [00:25<00:48,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7226, UAS: 0.8644, LAS: 0.7677, UEM: 0.3535, LEM: 0.1338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9962, partial_loss/deprel_loss: 2.0087, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0676, loss: 1.5945, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  38%|###7      | 42/111 [00:27<00:45,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7397, UAS: 0.8681, LAS: 0.7717, UEM: 0.3782, LEM: 0.1455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6230, partial_loss/deprel_loss: 1.7756, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8064, loss: 1.5545, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  41%|####1     | 46/111 [00:30<00:42,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.8698, LAS: 0.7736, UEM: 0.3770, LEM: 0.1440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6194, partial_loss/deprel_loss: 0.9456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9417, loss: 1.5345, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  45%|####5     | 50/111 [00:33<00:41,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7631, UAS: 0.8696, LAS: 0.7733, UEM: 0.3760, LEM: 0.1438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5292, partial_loss/deprel_loss: 1.6206, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6637, loss: 1.5373, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  48%|####7     | 53/111 [00:35<00:40,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7952, UAS: 0.8706, LAS: 0.7745, UEM: 0.3732, LEM: 0.1419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0361, partial_loss/deprel_loss: 1.3750, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3686, loss: 1.5272, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  50%|#####     | 56/111 [00:37<00:38,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.8725, LAS: 0.7769, UEM: 0.3885, LEM: 0.1536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6950, partial_loss/deprel_loss: 1.0568, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0458, loss: 1.5054, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  53%|#####3    | 59/111 [00:39<00:36,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.8729, LAS: 0.7771, UEM: 0.3914, LEM: 0.1520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6869, partial_loss/deprel_loss: 1.1239, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0979, loss: 1.5056, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  56%|#####5    | 62/111 [00:42<00:34,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7123, UAS: 0.8726, LAS: 0.7767, UEM: 0.3847, LEM: 0.1476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1384, partial_loss/deprel_loss: 1.9929, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0833, loss: 1.5100, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  59%|#####8    | 65/111 [00:44<00:32,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.8741, LAS: 0.7786, UEM: 0.4104, LEM: 0.1780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1555, partial_loss/deprel_loss: 0.3590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3797, loss: 1.4902, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  61%|######1   | 68/111 [00:46<00:31,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6839, UAS: 0.8727, LAS: 0.7774, UEM: 0.4028, LEM: 0.1735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6867, partial_loss/deprel_loss: 2.2795, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4223, loss: 1.4995, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  64%|######3   | 71/111 [00:48<00:28,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7946, UAS: 0.8714, LAS: 0.7764, UEM: 0.3971, LEM: 0.1677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0939, partial_loss/deprel_loss: 1.3590, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3673, loss: 1.5104, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  68%|######7   | 75/111 [00:51<00:24,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6175, UAS: 0.8696, LAS: 0.7746, UEM: 0.3921, LEM: 0.1644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8233, partial_loss/deprel_loss: 2.8003, partial_loss/cycle_loss: 0.0000, batch_loss: 3.0663, loss: 1.5301, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  71%|#######1  | 79/111 [00:53<00:20,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7637, UAS: 0.8661, LAS: 0.7709, UEM: 0.3842, LEM: 0.1610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5925, partial_loss/deprel_loss: 1.8030, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8223, loss: 1.5739, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  75%|#######4  | 83/111 [00:55<00:18,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7484, UAS: 0.8666, LAS: 0.7714, UEM: 0.3769, LEM: 0.1561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5992, partial_loss/deprel_loss: 1.6861, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7301, loss: 1.5698, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  78%|#######8  | 87/111 [00:58<00:16,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6880, UAS: 0.8660, LAS: 0.7708, UEM: 0.3766, LEM: 0.1560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6133, partial_loss/deprel_loss: 2.1378, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2944, loss: 1.5744, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||:  81%|########1 | 90/111 [01:01<00:15,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7145, UAS: 0.8654, LAS: 0.7703, UEM: 0.3729, LEM: 0.1542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3646, partial_loss/deprel_loss: 2.0728, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1926, loss: 1.5798, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||:  84%|########3 | 93/111 [01:03<00:13,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7754, UAS: 0.8652, LAS: 0.7702, UEM: 0.3709, LEM: 0.1526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2314, partial_loss/deprel_loss: 1.5581, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5543, loss: 1.5834, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||:  86%|########6 | 96/111 [01:05<00:10,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7925, UAS: 0.8642, LAS: 0.7695, UEM: 0.3719, LEM: 0.1529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1520, partial_loss/deprel_loss: 1.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3735, loss: 1.5922, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||:  89%|########9 | 99/111 [01:08<00:08,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6972, UAS: 0.8644, LAS: 0.7697, UEM: 0.3691, LEM: 0.1504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3335, partial_loss/deprel_loss: 2.2219, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3058, loss: 1.5920, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||:  93%|#########2| 103/111 [01:10<00:05,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.8655, LAS: 0.7711, UEM: 0.3800, LEM: 0.1593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2474, partial_loss/deprel_loss: 0.5589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5582, loss: 1.5770, batch_reg_loss: 0.0616, reg_loss: 0.0614 ||:  95%|#########5| 106/111 [01:12<00:03,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7927, UAS: 0.8653, LAS: 0.7706, UEM: 0.3763, LEM: 0.1567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9309, partial_loss/deprel_loss: 1.2968, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2852, loss: 1.5809, batch_reg_loss: 0.0616, reg_loss: 0.0614 ||:  98%|#########8| 109/111 [01:14<00:01,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8018, UAS: 0.8655, LAS: 0.7708, UEM: 0.3731, LEM: 0.1547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8911, partial_loss/deprel_loss: 1.3144, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2913, loss: 1.5809, batch_reg_loss: 0.0616, reg_loss: 0.0614 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
+      "2023-04-06 22:57:49,583 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8182, UAS: 0.9041, LAS: 0.8223, UEM: 0.3590, LEM: 0.0897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9126, partial_loss/deprel_loss: 32.0601, partial_loss/cycle_loss: 0.0000, batch_loss: 25.8306, loss: 27.0349, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9214, LAS: 0.8453, UEM: 0.5769, LEM: 0.3145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4594, partial_loss/deprel_loss: 16.4050, partial_loss/cycle_loss: 0.0000, batch_loss: 13.2159, loss: 21.8993, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7466, UAS: 0.9121, LAS: 0.8362, UEM: 0.5609, LEM: 0.3025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1975, partial_loss/deprel_loss: 54.5662, partial_loss/cycle_loss: 0.0000, batch_loss: 44.0925, loss: 25.0782, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8448, UAS: 0.9151, LAS: 0.8387, UEM: 0.5397, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6377, partial_loss/deprel_loss: 22.6314, partial_loss/cycle_loss: 0.0000, batch_loss: 18.2327, loss: 23.8980, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8053, UAS: 0.9130, LAS: 0.8361, UEM: 0.5198, LEM: 0.2546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3525, partial_loss/deprel_loss: 34.6234, partial_loss/cycle_loss: 0.0000, batch_loss: 27.9692, loss: 24.2112, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.05it/s]\n",
+      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.314  |    34.623\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.891  |     1.353\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.061  |     0.000\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - UEM                      |     0.373  |     0.520\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - LAS                      |     0.771  |     0.836\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - loss                     |     1.581  |    24.211\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - LEM                      |     0.155  |     0.255\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - UAS                      |     0.866  |     0.913\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - EM                       |     0.802  |     0.805\n",
+      "2023-04-06 22:58:01,931 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 22:58:01,931 - INFO - combo.training.trainer - Epoch duration: 0:01:28.130781\n",
+      "2023-04-06 22:58:01,931 - INFO - combo.training.trainer - Estimated training time remaining: 9:01:20\n",
+      "2023-04-06 22:58:01,931 - INFO - allennlp.training.trainer - Epoch 6/399\n",
+      "2023-04-06 22:58:01,932 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 22:58:01,932 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:58:01,939 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7928, UAS: 0.8946, LAS: 0.8032, UEM: 0.3837, LEM: 0.1392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9781, partial_loss/deprel_loss: 1.3434, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3320, loss: 1.3132, batch_reg_loss: 0.0616, reg_loss: 0.0616 ||:   3%|2         | 3/111 [00:02<01:16,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8273, UAS: 0.8970, LAS: 0.8065, UEM: 0.4021, LEM: 0.1350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5714, partial_loss/deprel_loss: 0.9386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9268, loss: 1.2471, batch_reg_loss: 0.0616, reg_loss: 0.0616 ||:   5%|5         | 6/111 [00:04<01:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8161, UAS: 0.8897, LAS: 0.7999, UEM: 0.3630, LEM: 0.1180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9064, partial_loss/deprel_loss: 1.2405, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2353, loss: 1.3079, batch_reg_loss: 0.0617, reg_loss: 0.0616 ||:   9%|9         | 10/111 [00:06<01:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7893, UAS: 0.8751, LAS: 0.7831, UEM: 0.3085, LEM: 0.0989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1124, partial_loss/deprel_loss: 1.4383, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4348, loss: 1.4786, batch_reg_loss: 0.0617, reg_loss: 0.0616 ||:  13%|#2        | 14/111 [00:08<01:02,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8441, UAS: 0.8743, LAS: 0.7827, UEM: 0.3527, LEM: 0.1199, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4962, partial_loss/deprel_loss: 0.8334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8276, loss: 1.4829, batch_reg_loss: 0.0617, reg_loss: 0.0616 ||:  15%|#5        | 17/111 [00:11<01:04,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6250, UAS: 0.8694, LAS: 0.7787, UEM: 0.3480, LEM: 0.1177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.1969, partial_loss/deprel_loss: 2.8191, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1564, loss: 1.5361, batch_reg_loss: 0.0617, reg_loss: 0.0617 ||:  19%|#8        | 21/111 [00:13<01:00,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7569, UAS: 0.8693, LAS: 0.7786, UEM: 0.3166, LEM: 0.1037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5271, partial_loss/deprel_loss: 1.8119, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8167, loss: 1.5297, batch_reg_loss: 0.0617, reg_loss: 0.0617 ||:  23%|##2       | 25/111 [00:16<00:56,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7141, UAS: 0.8677, LAS: 0.7759, UEM: 0.3006, LEM: 0.0945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3811, partial_loss/deprel_loss: 2.0258, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1586, loss: 1.5526, batch_reg_loss: 0.0618, reg_loss: 0.0617 ||:  26%|##6       | 29/111 [00:18<00:53,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7306, UAS: 0.8672, LAS: 0.7753, UEM: 0.3126, LEM: 0.1007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0218, partial_loss/deprel_loss: 1.8331, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9327, loss: 1.5604, batch_reg_loss: 0.0618, reg_loss: 0.0617 ||:  30%|##9       | 33/111 [00:21<00:50,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7770, UAS: 0.8695, LAS: 0.7770, UEM: 0.3171, LEM: 0.1003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3398, partial_loss/deprel_loss: 1.4502, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4899, loss: 1.5471, batch_reg_loss: 0.0618, reg_loss: 0.0617 ||:  33%|###3      | 37/111 [00:23<00:46,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7841, UAS: 0.8650, LAS: 0.7722, UEM: 0.3010, LEM: 0.0950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2401, partial_loss/deprel_loss: 1.4031, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4324, loss: 1.6028, batch_reg_loss: 0.0619, reg_loss: 0.0617 ||:  37%|###6      | 41/111 [00:26<00:42,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.8680, LAS: 0.7754, UEM: 0.3355, LEM: 0.1209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.5893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5828, loss: 1.5741, batch_reg_loss: 0.0619, reg_loss: 0.0617 ||:  41%|####      | 45/111 [00:29<00:43,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8182, UAS: 0.8696, LAS: 0.7771, UEM: 0.3369, LEM: 0.1205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6923, partial_loss/deprel_loss: 1.0521, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0421, loss: 1.5538, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||:  44%|####4     | 49/111 [00:31<00:41,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7539, UAS: 0.8692, LAS: 0.7765, UEM: 0.3256, LEM: 0.1145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6915, partial_loss/deprel_loss: 1.8414, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8734, loss: 1.5572, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||:  48%|####7     | 53/111 [00:34<00:38,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.8703, LAS: 0.7782, UEM: 0.3360, LEM: 0.1201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6520, partial_loss/deprel_loss: 0.8937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9074, loss: 1.5379, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||:  51%|#####1    | 57/111 [00:37<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8116, UAS: 0.8717, LAS: 0.7799, UEM: 0.3610, LEM: 0.1445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9092, partial_loss/deprel_loss: 1.1890, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1951, loss: 1.5218, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||:  54%|#####4    | 60/111 [00:39<00:36,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8035, UAS: 0.8727, LAS: 0.7813, UEM: 0.3561, LEM: 0.1403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1905, partial_loss/deprel_loss: 1.2473, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2980, loss: 1.5067, batch_reg_loss: 0.0621, reg_loss: 0.0618 ||:  57%|#####6    | 63/111 [00:42<00:34,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.8749, LAS: 0.7839, UEM: 0.3711, LEM: 0.1484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2916, partial_loss/deprel_loss: 0.6615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6496, loss: 1.4817, batch_reg_loss: 0.0621, reg_loss: 0.0618 ||:  59%|#####9    | 66/111 [00:44<00:31,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7580, UAS: 0.8736, LAS: 0.7826, UEM: 0.3745, LEM: 0.1515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5556, partial_loss/deprel_loss: 1.6028, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6555, loss: 1.4939, batch_reg_loss: 0.0621, reg_loss: 0.0618 ||:  63%|######3   | 70/111 [00:46<00:28,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.8744, LAS: 0.7837, UEM: 0.3851, LEM: 0.1595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3390, partial_loss/deprel_loss: 0.6582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6565, loss: 1.4852, batch_reg_loss: 0.0621, reg_loss: 0.0619 ||:  66%|######5   | 73/111 [00:50<00:34,  1.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8116, UAS: 0.8754, LAS: 0.7846, UEM: 0.3853, LEM: 0.1580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8573, partial_loss/deprel_loss: 1.2353, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2218, loss: 1.4768, batch_reg_loss: 0.0621, reg_loss: 0.0619 ||:  68%|######8   | 76/111 [00:53<00:31,  1.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.8775, LAS: 0.7871, UEM: 0.4008, LEM: 0.1662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4426, partial_loss/deprel_loss: 0.8148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8025, loss: 1.4523, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||:  71%|#######1  | 79/111 [00:55<00:27,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7632, UAS: 0.8768, LAS: 0.7867, UEM: 0.4232, LEM: 0.1931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3685, partial_loss/deprel_loss: 1.5348, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5637, loss: 1.4562, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||:  74%|#######3  | 82/111 [00:58<00:24,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7120, UAS: 0.8759, LAS: 0.7859, UEM: 0.4157, LEM: 0.1885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3845, partial_loss/deprel_loss: 2.0313, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1642, loss: 1.4645, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||:  77%|#######7  | 86/111 [01:00<00:18,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8155, UAS: 0.8760, LAS: 0.7861, UEM: 0.4115, LEM: 0.1853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8067, partial_loss/deprel_loss: 1.1319, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1291, loss: 1.4605, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||:  80%|########  | 89/111 [01:02<00:16,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7328, UAS: 0.8753, LAS: 0.7855, UEM: 0.4026, LEM: 0.1804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2779, partial_loss/deprel_loss: 1.9162, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0508, loss: 1.4669, batch_reg_loss: 0.0623, reg_loss: 0.0619 ||:  84%|########3 | 93/111 [01:04<00:12,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8328, UAS: 0.8765, LAS: 0.7868, UEM: 0.4051, LEM: 0.1809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8328, partial_loss/deprel_loss: 1.0645, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0804, loss: 1.4538, batch_reg_loss: 0.0623, reg_loss: 0.0619 ||:  86%|########6 | 96/111 [01:06<00:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8406, UAS: 0.8762, LAS: 0.7865, UEM: 0.4014, LEM: 0.1783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5521, partial_loss/deprel_loss: 0.9905, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9651, loss: 1.4581, batch_reg_loss: 0.0623, reg_loss: 0.0619 ||:  89%|########9 | 99/111 [01:09<00:08,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7715, UAS: 0.8767, LAS: 0.7872, UEM: 0.3993, LEM: 0.1761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3737, partial_loss/deprel_loss: 1.5367, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5665, loss: 1.4511, batch_reg_loss: 0.0624, reg_loss: 0.0620 ||:  92%|#########1| 102/111 [01:11<00:06,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7680, UAS: 0.8764, LAS: 0.7870, UEM: 0.3919, LEM: 0.1721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4850, partial_loss/deprel_loss: 1.6062, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6444, loss: 1.4537, batch_reg_loss: 0.0624, reg_loss: 0.0620 ||:  95%|#########5| 106/111 [01:13<00:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.8768, LAS: 0.7875, UEM: 0.3925, LEM: 0.1722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4828, partial_loss/deprel_loss: 0.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8236, loss: 1.4500, batch_reg_loss: 0.0624, reg_loss: 0.0620 ||:  98%|#########8| 109/111 [01:15<00:01,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8117, UAS: 0.8776, LAS: 0.7883, UEM: 0.3955, LEM: 0.1736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9031, partial_loss/deprel_loss: 1.2503, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2433, loss: 1.4419, batch_reg_loss: 0.0625, reg_loss: 0.0620 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.250  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.903  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.062  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - UEM                      |     0.395  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - LAS                      |     0.788  |       N/A\n",
+      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - loss                     |     1.442  |       N/A\n",
+      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
+      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - LEM                      |     0.174  |       N/A\n",
+      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - UAS                      |     0.878  |       N/A\n",
+      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - EM                       |     0.812  |       N/A\n",
+      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 22:59:19,354 - INFO - combo.training.trainer - Epoch duration: 0:01:17.422262\n",
+      "2023-04-06 22:59:19,354 - INFO - combo.training.trainer - Estimated training time remaining: 8:55:16\n",
+      "2023-04-06 22:59:19,354 - INFO - allennlp.training.trainer - Epoch 7/399\n",
+      "2023-04-06 22:59:19,354 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 22:59:19,354 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 22:59:19,361 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8629, UAS: 0.8724, LAS: 0.7842, UEM: 0.3680, LEM: 0.1364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4368, partial_loss/deprel_loss: 0.7830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7763, loss: 1.4874, batch_reg_loss: 0.0625, reg_loss: 0.0625 ||:   4%|3         | 4/111 [00:02<01:11,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7297, UAS: 0.8701, LAS: 0.7828, UEM: 0.4033, LEM: 0.1768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0957, partial_loss/deprel_loss: 1.9928, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0759, loss: 1.5090, batch_reg_loss: 0.0625, reg_loss: 0.0625 ||:   6%|6         | 7/111 [00:05<01:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7719, UAS: 0.8774, LAS: 0.7933, UEM: 0.3826, LEM: 0.1651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4563, partial_loss/deprel_loss: 1.6923, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7077, loss: 1.4414, batch_reg_loss: 0.0626, reg_loss: 0.0625 ||:  10%|9         | 11/111 [00:07<01:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8024, UAS: 0.8787, LAS: 0.7934, UEM: 0.3521, LEM: 0.1407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9573, partial_loss/deprel_loss: 1.2649, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2660, loss: 1.4205, batch_reg_loss: 0.0626, reg_loss: 0.0625 ||:  14%|#3        | 15/111 [00:09<01:01,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7615, UAS: 0.8748, LAS: 0.7881, UEM: 0.3135, LEM: 0.1196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6249, partial_loss/deprel_loss: 1.6581, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7141, loss: 1.4666, batch_reg_loss: 0.0627, reg_loss: 0.0626 ||:  17%|#7        | 19/111 [00:12<00:58,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8370, UAS: 0.8822, LAS: 0.7962, UEM: 0.3660, LEM: 0.1485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6126, partial_loss/deprel_loss: 0.9570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9508, loss: 1.3872, batch_reg_loss: 0.0627, reg_loss: 0.0626 ||:  20%|#9        | 22/111 [00:14<00:58,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6689, UAS: 0.8766, LAS: 0.7911, UEM: 0.3612, LEM: 0.1459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2741, partial_loss/deprel_loss: 2.4141, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6488, loss: 1.4397, batch_reg_loss: 0.0628, reg_loss: 0.0626 ||:  23%|##3       | 26/111 [00:16<00:53,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8573, UAS: 0.8769, LAS: 0.7922, UEM: 0.3532, LEM: 0.1394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6586, partial_loss/deprel_loss: 0.9206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9310, loss: 1.4379, batch_reg_loss: 0.0628, reg_loss: 0.0626 ||:  27%|##7       | 30/111 [00:19<00:51,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.8768, LAS: 0.7918, UEM: 0.3561, LEM: 0.1370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4872, partial_loss/deprel_loss: 0.8191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8156, loss: 1.4428, batch_reg_loss: 0.0629, reg_loss: 0.0627 ||:  31%|###       | 34/111 [00:21<00:49,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7718, UAS: 0.8759, LAS: 0.7906, UEM: 0.3526, LEM: 0.1360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3521, partial_loss/deprel_loss: 1.4910, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5261, loss: 1.4532, batch_reg_loss: 0.0629, reg_loss: 0.0627 ||:  34%|###4      | 38/111 [00:24<00:47,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7682, UAS: 0.8763, LAS: 0.7911, UEM: 0.3421, LEM: 0.1291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5765, partial_loss/deprel_loss: 1.6436, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6931, loss: 1.4514, batch_reg_loss: 0.0630, reg_loss: 0.0627 ||:  38%|###7      | 42/111 [00:27<00:45,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8301, UAS: 0.8781, LAS: 0.7929, UEM: 0.3316, LEM: 0.1220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7117, partial_loss/deprel_loss: 1.1158, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0980, loss: 1.4348, batch_reg_loss: 0.0630, reg_loss: 0.0627 ||:  41%|####1     | 46/111 [00:29<00:40,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7495, UAS: 0.8762, LAS: 0.7916, UEM: 0.3351, LEM: 0.1242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0049, partial_loss/deprel_loss: 1.8432, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9386, loss: 1.4529, batch_reg_loss: 0.0631, reg_loss: 0.0628 ||:  45%|####5     | 50/111 [00:31<00:37,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7735, UAS: 0.8790, LAS: 0.7953, UEM: 0.3877, LEM: 0.1736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4529, partial_loss/deprel_loss: 1.4813, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5387, loss: 1.4166, batch_reg_loss: 0.0631, reg_loss: 0.0628 ||:  49%|####8     | 54/111 [00:35<00:39,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8136, UAS: 0.8792, LAS: 0.7954, UEM: 0.3826, LEM: 0.1685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9952, partial_loss/deprel_loss: 1.2018, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2236, loss: 1.4151, batch_reg_loss: 0.0631, reg_loss: 0.0628 ||:  51%|#####1    | 57/111 [00:37<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7092, UAS: 0.8797, LAS: 0.7962, UEM: 0.4184, LEM: 0.2082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7240, partial_loss/deprel_loss: 2.1644, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3395, loss: 1.4103, batch_reg_loss: 0.0632, reg_loss: 0.0628 ||:  54%|#####4    | 60/111 [00:39<00:36,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7540, UAS: 0.8799, LAS: 0.7961, UEM: 0.4070, LEM: 0.1991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8092, partial_loss/deprel_loss: 1.7140, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7963, loss: 1.4121, batch_reg_loss: 0.0632, reg_loss: 0.0628 ||:  58%|#####7    | 64/111 [00:42<00:32,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8109, UAS: 0.8805, LAS: 0.7967, UEM: 0.4083, LEM: 0.2006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9000, partial_loss/deprel_loss: 1.1946, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1989, loss: 1.4027, batch_reg_loss: 0.0633, reg_loss: 0.0629 ||:  60%|######    | 67/111 [00:44<00:30,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8382, UAS: 0.8815, LAS: 0.7979, UEM: 0.4116, LEM: 0.2017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6882, partial_loss/deprel_loss: 0.9346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9486, loss: 1.3897, batch_reg_loss: 0.0633, reg_loss: 0.0629 ||:  63%|######3   | 70/111 [00:46<00:30,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.8812, LAS: 0.7976, UEM: 0.4122, LEM: 0.2035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3938, partial_loss/deprel_loss: 0.6384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6529, loss: 1.3910, batch_reg_loss: 0.0634, reg_loss: 0.0629 ||:  66%|######5   | 73/111 [00:48<00:27,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8465, UAS: 0.8816, LAS: 0.7982, UEM: 0.4122, LEM: 0.2019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6296, partial_loss/deprel_loss: 0.9116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9186, loss: 1.3860, batch_reg_loss: 0.0634, reg_loss: 0.0629 ||:  68%|######8   | 76/111 [00:50<00:25,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7487, UAS: 0.8817, LAS: 0.7982, UEM: 0.4104, LEM: 0.1998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8556, partial_loss/deprel_loss: 1.6892, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7859, loss: 1.3852, batch_reg_loss: 0.0634, reg_loss: 0.0629 ||:  71%|#######1  | 79/111 [00:53<00:22,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8273, UAS: 0.8828, LAS: 0.7995, UEM: 0.4079, LEM: 0.1960, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8511, partial_loss/deprel_loss: 1.1586, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1606, loss: 1.3738, batch_reg_loss: 0.0635, reg_loss: 0.0630 ||:  74%|#######3  | 82/111 [00:55<00:20,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7909, UAS: 0.8831, LAS: 0.7998, UEM: 0.3986, LEM: 0.1897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2809, partial_loss/deprel_loss: 1.4356, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4682, loss: 1.3714, batch_reg_loss: 0.0635, reg_loss: 0.0630 ||:  77%|#######7  | 86/111 [00:57<00:17,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.8841, LAS: 0.8011, UEM: 0.4051, LEM: 0.1932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3861, partial_loss/deprel_loss: 0.6754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6811, loss: 1.3591, batch_reg_loss: 0.0636, reg_loss: 0.0630 ||:  80%|########  | 89/111 [00:59<00:15,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8384, UAS: 0.8851, LAS: 0.8022, UEM: 0.4059, LEM: 0.1904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7558, partial_loss/deprel_loss: 0.8878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9250, loss: 1.3475, batch_reg_loss: 0.0636, reg_loss: 0.0630 ||:  83%|########2 | 92/111 [01:01<00:13,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6849, UAS: 0.8847, LAS: 0.8021, UEM: 0.4073, LEM: 0.1900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0226, partial_loss/deprel_loss: 2.1493, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3876, loss: 1.3458, batch_reg_loss: 0.0637, reg_loss: 0.0630 ||:  86%|########6 | 96/111 [01:04<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7306, UAS: 0.8834, LAS: 0.8006, UEM: 0.4017, LEM: 0.1872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0285, partial_loss/deprel_loss: 1.8749, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9693, loss: 1.3587, batch_reg_loss: 0.0637, reg_loss: 0.0631 ||:  89%|########9 | 99/111 [01:06<00:08,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8169, UAS: 0.8834, LAS: 0.8005, UEM: 0.4020, LEM: 0.1868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8733, partial_loss/deprel_loss: 1.1504, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1587, loss: 1.3588, batch_reg_loss: 0.0637, reg_loss: 0.0631 ||:  92%|#########1| 102/111 [01:09<00:06,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.8850, LAS: 0.8022, UEM: 0.4122, LEM: 0.1905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3123, partial_loss/deprel_loss: 0.6209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6230, loss: 1.3414, batch_reg_loss: 0.0638, reg_loss: 0.0631 ||:  95%|#########5| 106/111 [01:11<00:03,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.8857, LAS: 0.8029, UEM: 0.4147, LEM: 0.1914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4652, partial_loss/deprel_loss: 0.7915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7900, loss: 1.3339, batch_reg_loss: 0.0638, reg_loss: 0.0631 ||:  98%|#########8| 109/111 [01:13<00:01,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8271, UAS: 0.8854, LAS: 0.8026, UEM: 0.4124, LEM: 0.1897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8597, partial_loss/deprel_loss: 0.9947, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0315, loss: 1.3354, batch_reg_loss: 0.0638, reg_loss: 0.0631 ||: 100%|##########| 111/111 [01:15<00:00,  1.48it/s]\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.995  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.860  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.063  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - UEM                      |     0.412  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - LAS                      |     0.803  |       N/A\n",
+      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - loss                     |     1.335  |       N/A\n",
+      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
+      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - LEM                      |     0.190  |       N/A\n",
+      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - UAS                      |     0.885  |       N/A\n",
+      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - EM                       |     0.827  |       N/A\n",
+      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:00:34,377 - INFO - combo.training.trainer - Epoch duration: 0:01:15.022627\n",
+      "2023-04-06 23:00:34,377 - INFO - combo.training.trainer - Estimated training time remaining: 8:48:26\n",
+      "2023-04-06 23:00:34,377 - INFO - allennlp.training.trainer - Epoch 8/399\n",
+      "2023-04-06 23:00:34,377 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-06 23:00:34,377 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:00:34,384 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8241, UAS: 0.8930, LAS: 0.8071, UEM: 0.2937, LEM: 0.0688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8920, partial_loss/deprel_loss: 1.0848, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1101, loss: 1.2838, batch_reg_loss: 0.0639, reg_loss: 0.0639 ||:   4%|3         | 4/111 [00:02<01:05,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8233, UAS: 0.8886, LAS: 0.8066, UEM: 0.3058, LEM: 0.0816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9010, partial_loss/deprel_loss: 1.1552, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1683, loss: 1.2793, batch_reg_loss: 0.0640, reg_loss: 0.0639 ||:   7%|7         | 8/111 [00:04<01:03,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9018, LAS: 0.8220, UEM: 0.5010, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1971, partial_loss/deprel_loss: 0.4135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4342, loss: 1.1506, batch_reg_loss: 0.0640, reg_loss: 0.0639 ||:  10%|9         | 11/111 [00:07<01:03,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8606, UAS: 0.8885, LAS: 0.8093, UEM: 0.5000, LEM: 0.2546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4594, partial_loss/deprel_loss: 0.6960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 1.3050, batch_reg_loss: 0.0640, reg_loss: 0.0640 ||:  13%|#2        | 14/111 [00:09<01:07,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.8872, LAS: 0.8077, UEM: 0.4793, LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5064, partial_loss/deprel_loss: 0.7968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8028, loss: 1.3102, batch_reg_loss: 0.0641, reg_loss: 0.0640 ||:  15%|#5        | 17/111 [00:11<01:08,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7552, UAS: 0.8892, LAS: 0.8111, UEM: 0.4579, LEM: 0.2212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8160, partial_loss/deprel_loss: 1.5796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6910, loss: 1.2699, batch_reg_loss: 0.0641, reg_loss: 0.0640 ||:  19%|#8        | 21/111 [00:14<01:01,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8090, UAS: 0.8856, LAS: 0.8065, UEM: 0.4306, LEM: 0.2060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1190, partial_loss/deprel_loss: 1.1705, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2244, loss: 1.3033, batch_reg_loss: 0.0642, reg_loss: 0.0640 ||:  22%|##1       | 24/111 [00:16<00:59,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7897, UAS: 0.8861, LAS: 0.8069, UEM: 0.4112, LEM: 0.1927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2958, partial_loss/deprel_loss: 1.3087, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3704, loss: 1.2958, batch_reg_loss: 0.0642, reg_loss: 0.0640 ||:  24%|##4       | 27/111 [00:18<01:00,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7306, UAS: 0.8839, LAS: 0.8044, UEM: 0.4072, LEM: 0.1892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4421, partial_loss/deprel_loss: 1.8969, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0702, loss: 1.3262, batch_reg_loss: 0.0643, reg_loss: 0.0641 ||:  27%|##7       | 30/111 [00:20<00:59,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8245, UAS: 0.8813, LAS: 0.8011, UEM: 0.3874, LEM: 0.1759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8848, partial_loss/deprel_loss: 1.1863, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1903, loss: 1.3609, batch_reg_loss: 0.0644, reg_loss: 0.0641 ||:  31%|###       | 34/111 [00:23<00:53,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7990, UAS: 0.8837, LAS: 0.8038, UEM: 0.4387, LEM: 0.2372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1111, partial_loss/deprel_loss: 1.2691, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3019, loss: 1.3366, batch_reg_loss: 0.0644, reg_loss: 0.0641 ||:  33%|###3      | 37/111 [00:25<00:52,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7902, UAS: 0.8854, LAS: 0.8050, UEM: 0.4272, LEM: 0.2249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3545, partial_loss/deprel_loss: 1.4825, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5214, loss: 1.3286, batch_reg_loss: 0.0645, reg_loss: 0.0642 ||:  36%|###6      | 40/111 [00:27<00:49,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.8877, LAS: 0.8072, UEM: 0.4217, LEM: 0.2144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5300, partial_loss/deprel_loss: 0.9049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8945, loss: 1.3072, batch_reg_loss: 0.0645, reg_loss: 0.0642 ||:  39%|###8      | 43/111 [00:29<00:47,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8620, UAS: 0.8908, LAS: 0.8105, UEM: 0.4339, LEM: 0.2148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5897, partial_loss/deprel_loss: 0.8662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8754, loss: 1.2774, batch_reg_loss: 0.0646, reg_loss: 0.0642 ||:  41%|####1     | 46/111 [00:32<00:47,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8295, UAS: 0.8909, LAS: 0.8105, UEM: 0.4243, LEM: 0.2074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8100, partial_loss/deprel_loss: 0.9878, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0168, loss: 1.2768, batch_reg_loss: 0.0646, reg_loss: 0.0642 ||:  44%|####4     | 49/111 [00:34<00:45,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.8901, LAS: 0.8096, UEM: 0.4112, LEM: 0.1977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7876, partial_loss/deprel_loss: 0.9327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9683, loss: 1.2818, batch_reg_loss: 0.0647, reg_loss: 0.0643 ||:  48%|####7     | 53/111 [00:36<00:39,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.8901, LAS: 0.8096, UEM: 0.4056, LEM: 0.1924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6974, partial_loss/deprel_loss: 0.9227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9424, loss: 1.2799, batch_reg_loss: 0.0647, reg_loss: 0.0643 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8424, UAS: 0.8911, LAS: 0.8107, UEM: 0.4065, LEM: 0.1909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7933, partial_loss/deprel_loss: 0.9271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9651, loss: 1.2707, batch_reg_loss: 0.0648, reg_loss: 0.0643 ||:  54%|#####4    | 60/111 [00:41<00:34,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.8913, LAS: 0.8110, UEM: 0.4163, LEM: 0.1957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5222, partial_loss/deprel_loss: 0.8511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8501, loss: 1.2691, batch_reg_loss: 0.0648, reg_loss: 0.0643 ||:  57%|#####6    | 63/111 [00:43<00:33,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.8926, LAS: 0.8125, UEM: 0.4278, LEM: 0.2061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7491, partial_loss/deprel_loss: 1.0206, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0312, loss: 1.2552, batch_reg_loss: 0.0649, reg_loss: 0.0644 ||:  59%|#####9    | 66/111 [00:45<00:31,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8008, UAS: 0.8931, LAS: 0.8132, UEM: 0.4331, LEM: 0.2078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1884, partial_loss/deprel_loss: 1.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3227, loss: 1.2490, batch_reg_loss: 0.0649, reg_loss: 0.0644 ||:  63%|######3   | 70/111 [00:48<00:27,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7758, UAS: 0.8925, LAS: 0.8121, UEM: 0.4233, LEM: 0.2014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4103, partial_loss/deprel_loss: 1.5663, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6001, loss: 1.2582, batch_reg_loss: 0.0650, reg_loss: 0.0644 ||:  67%|######6   | 74/111 [00:50<00:24,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.8917, LAS: 0.8114, UEM: 0.4194, LEM: 0.1977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5735, partial_loss/deprel_loss: 0.8557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8643, loss: 1.2660, batch_reg_loss: 0.0651, reg_loss: 0.0645 ||:  70%|#######   | 78/111 [00:53<00:22,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.8931, LAS: 0.8129, UEM: 0.4242, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.7510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7497, loss: 1.2519, batch_reg_loss: 0.0651, reg_loss: 0.0645 ||:  73%|#######2  | 81/111 [00:55<00:21,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6999, UAS: 0.8912, LAS: 0.8106, UEM: 0.4176, LEM: 0.1948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5586, partial_loss/deprel_loss: 2.1598, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3047, loss: 1.2725, batch_reg_loss: 0.0651, reg_loss: 0.0645 ||:  76%|#######5  | 84/111 [00:57<00:18,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7984, UAS: 0.8920, LAS: 0.8114, UEM: 0.4254, LEM: 0.2002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2174, partial_loss/deprel_loss: 1.3746, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4084, loss: 1.2663, batch_reg_loss: 0.0652, reg_loss: 0.0645 ||:  79%|#######9  | 88/111 [01:00<00:15,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7645, UAS: 0.8914, LAS: 0.8106, UEM: 0.4171, LEM: 0.1945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7351, partial_loss/deprel_loss: 1.6841, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7596, loss: 1.2742, batch_reg_loss: 0.0653, reg_loss: 0.0646 ||:  83%|########2 | 92/111 [01:02<00:12,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.8916, LAS: 0.8109, UEM: 0.4169, LEM: 0.1940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4136, partial_loss/deprel_loss: 0.6496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6677, loss: 1.2720, batch_reg_loss: 0.0653, reg_loss: 0.0646 ||:  86%|########6 | 96/111 [01:05<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8617, UAS: 0.8930, LAS: 0.8124, UEM: 0.4280, LEM: 0.2003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4469, partial_loss/deprel_loss: 0.7590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7619, loss: 1.2586, batch_reg_loss: 0.0654, reg_loss: 0.0646 ||:  89%|########9 | 99/111 [01:08<00:08,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7769, UAS: 0.8935, LAS: 0.8130, UEM: 0.4298, LEM: 0.2005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6781, partial_loss/deprel_loss: 1.5453, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6373, loss: 1.2527, batch_reg_loss: 0.0655, reg_loss: 0.0646 ||:  92%|#########1| 102/111 [01:10<00:06,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6829, UAS: 0.8911, LAS: 0.8105, UEM: 0.4258, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.1513, partial_loss/deprel_loss: 2.1113, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3848, loss: 1.2753, batch_reg_loss: 0.0655, reg_loss: 0.0647 ||:  95%|#########4| 105/111 [01:13<00:04,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7566, UAS: 0.8903, LAS: 0.8095, UEM: 0.4247, LEM: 0.1967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8494, partial_loss/deprel_loss: 1.7516, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8367, loss: 1.2862, batch_reg_loss: 0.0656, reg_loss: 0.0647 ||:  97%|#########7| 108/111 [01:15<00:02,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8283, UAS: 0.8911, LAS: 0.8104, UEM: 0.4280, LEM: 0.1988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7554, partial_loss/deprel_loss: 1.0998, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0965, loss: 1.2771, batch_reg_loss: 0.0656, reg_loss: 0.0647 ||: 100%|##########| 111/111 [01:16<00:00,  1.44it/s]\n",
+      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.100  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.755  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.065  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - UEM                      |     0.428  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - LAS                      |     0.810  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - loss                     |     1.277  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - LEM                      |     0.199  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - UAS                      |     0.891  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - EM                       |     0.828  |       N/A\n",
+      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:01:51,359 - INFO - combo.training.trainer - Epoch duration: 0:01:16.982102\n",
+      "2023-04-06 23:01:51,359 - INFO - combo.training.trainer - Estimated training time remaining: 8:44:16\n",
+      "2023-04-06 23:01:51,359 - INFO - allennlp.training.trainer - Epoch 9/399\n",
+      "2023-04-06 23:01:51,359 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:01:51,359 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:01:51,366 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8694, UAS: 0.9255, LAS: 0.8548, UEM: 0.5504, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4220, partial_loss/deprel_loss: 0.6260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.8275, batch_reg_loss: 0.0656, reg_loss: 0.0656 ||:   3%|2         | 3/111 [00:02<01:21,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9245, LAS: 0.8515, UEM: 0.5266, LEM: 0.2491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7531, partial_loss/deprel_loss: 0.9576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9824, loss: 0.8760, batch_reg_loss: 0.0657, reg_loss: 0.0657 ||:   5%|5         | 6/111 [00:04<01:20,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8321, UAS: 0.9161, LAS: 0.8419, UEM: 0.4940, LEM: 0.2270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8656, partial_loss/deprel_loss: 1.0827, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.9815, batch_reg_loss: 0.0657, reg_loss: 0.0657 ||:   8%|8         | 9/111 [00:06<01:16,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8601, UAS: 0.9148, LAS: 0.8396, UEM: 0.4936, LEM: 0.2105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4626, partial_loss/deprel_loss: 0.7863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7874, loss: 1.0120, batch_reg_loss: 0.0658, reg_loss: 0.0657 ||:  11%|#         | 12/111 [00:09<01:14,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7472, UAS: 0.9118, LAS: 0.8363, UEM: 0.4936, LEM: 0.2092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1431, partial_loss/deprel_loss: 1.7409, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8873, loss: 1.0389, batch_reg_loss: 0.0659, reg_loss: 0.0657 ||:  14%|#4        | 16/111 [00:11<01:06,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8605, UAS: 0.9033, LAS: 0.8265, UEM: 0.4604, LEM: 0.1912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5063, partial_loss/deprel_loss: 0.8511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8481, loss: 1.1324, batch_reg_loss: 0.0659, reg_loss: 0.0658 ||:  18%|#8        | 20/111 [00:13<01:00,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8059, UAS: 0.9014, LAS: 0.8239, UEM: 0.4295, LEM: 0.1726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1199, partial_loss/deprel_loss: 1.4563, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4550, loss: 1.1575, batch_reg_loss: 0.0660, reg_loss: 0.0658 ||:  22%|##1       | 24/111 [00:16<00:57,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7750, UAS: 0.8952, LAS: 0.8171, UEM: 0.4111, LEM: 0.1644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6847, partial_loss/deprel_loss: 1.5184, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6177, loss: 1.2197, batch_reg_loss: 0.0661, reg_loss: 0.0658 ||:  25%|##5       | 28/111 [00:18<00:52,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7462, UAS: 0.8923, LAS: 0.8137, UEM: 0.3953, LEM: 0.1563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2574, partial_loss/deprel_loss: 1.8212, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9746, loss: 1.2571, batch_reg_loss: 0.0662, reg_loss: 0.0659 ||:  29%|##8       | 32/111 [00:21<00:50,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.8916, LAS: 0.8133, UEM: 0.3940, LEM: 0.1561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5520, partial_loss/deprel_loss: 0.7620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7862, loss: 1.2609, batch_reg_loss: 0.0662, reg_loss: 0.0659 ||:  32%|###2      | 36/111 [00:23<00:48,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8140, UAS: 0.8902, LAS: 0.8114, UEM: 0.3764, LEM: 0.1479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1807, partial_loss/deprel_loss: 1.2136, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2734, loss: 1.2838, batch_reg_loss: 0.0663, reg_loss: 0.0660 ||:  36%|###6      | 40/111 [00:26<00:45,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.8915, LAS: 0.8126, UEM: 0.4016, LEM: 0.1669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2704, partial_loss/deprel_loss: 0.5464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5576, loss: 1.2723, batch_reg_loss: 0.0664, reg_loss: 0.0660 ||:  40%|###9      | 44/111 [00:29<00:43,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8098, UAS: 0.8917, LAS: 0.8122, UEM: 0.3866, LEM: 0.1573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9682, partial_loss/deprel_loss: 1.2962, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2971, loss: 1.2742, batch_reg_loss: 0.0665, reg_loss: 0.0660 ||:  43%|####3     | 48/111 [00:31<00:41,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.8915, LAS: 0.8119, UEM: 0.3734, LEM: 0.1493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8617, partial_loss/deprel_loss: 1.0904, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1112, loss: 1.2763, batch_reg_loss: 0.0666, reg_loss: 0.0661 ||:  47%|####6     | 52/111 [00:34<00:39,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.8937, LAS: 0.8143, UEM: 0.3817, LEM: 0.1525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8274, partial_loss/deprel_loss: 0.9894, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0237, loss: 1.2510, batch_reg_loss: 0.0666, reg_loss: 0.0661 ||:  50%|#####     | 56/111 [00:37<00:37,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7726, UAS: 0.8911, LAS: 0.8114, UEM: 0.3731, LEM: 0.1485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7883, partial_loss/deprel_loss: 1.6515, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7456, loss: 1.2778, batch_reg_loss: 0.0667, reg_loss: 0.0661 ||:  53%|#####3    | 59/111 [00:39<00:35,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.8919, LAS: 0.8123, UEM: 0.3775, LEM: 0.1503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3845, partial_loss/deprel_loss: 0.6765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6848, loss: 1.2680, batch_reg_loss: 0.0668, reg_loss: 0.0662 ||:  57%|#####6    | 63/111 [00:42<00:33,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.8923, LAS: 0.8129, UEM: 0.3800, LEM: 0.1507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3847, partial_loss/deprel_loss: 0.6543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6672, loss: 1.2614, batch_reg_loss: 0.0668, reg_loss: 0.0662 ||:  60%|######    | 67/111 [00:45<00:30,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.8945, LAS: 0.8153, UEM: 0.3887, LEM: 0.1545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4404, partial_loss/deprel_loss: 0.7233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7337, loss: 1.2393, batch_reg_loss: 0.0669, reg_loss: 0.0663 ||:  64%|######3   | 71/111 [00:47<00:27,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8122, UAS: 0.8962, LAS: 0.8173, UEM: 0.4219, LEM: 0.1912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9752, partial_loss/deprel_loss: 1.3085, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3088, loss: 1.2234, batch_reg_loss: 0.0670, reg_loss: 0.0663 ||:  67%|######6   | 74/111 [00:50<00:26,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7825, UAS: 0.8964, LAS: 0.8179, UEM: 0.4236, LEM: 0.1933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5015, partial_loss/deprel_loss: 1.4831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5538, loss: 1.2192, batch_reg_loss: 0.0670, reg_loss: 0.0663 ||:  69%|######9   | 77/111 [00:52<00:24,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8175, UAS: 0.8970, LAS: 0.8187, UEM: 0.4197, LEM: 0.1886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0788, partial_loss/deprel_loss: 1.1409, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1956, loss: 1.2138, batch_reg_loss: 0.0671, reg_loss: 0.0663 ||:  73%|#######2  | 81/111 [00:54<00:20,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8500, UAS: 0.8961, LAS: 0.8179, UEM: 0.4136, LEM: 0.1848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7436, partial_loss/deprel_loss: 0.8710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9127, loss: 1.2214, batch_reg_loss: 0.0672, reg_loss: 0.0664 ||:  77%|#######6  | 85/111 [00:57<00:17,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7341, UAS: 0.8956, LAS: 0.8174, UEM: 0.4083, LEM: 0.1813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2575, partial_loss/deprel_loss: 1.8813, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0237, loss: 1.2272, batch_reg_loss: 0.0672, reg_loss: 0.0664 ||:  80%|########  | 89/111 [00:59<00:14,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.8969, LAS: 0.8191, UEM: 0.4323, LEM: 0.2002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2403, partial_loss/deprel_loss: 0.5870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 1.2123, batch_reg_loss: 0.0673, reg_loss: 0.0665 ||:  84%|########3 | 93/111 [01:02<00:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7063, UAS: 0.8948, LAS: 0.8169, UEM: 0.4339, LEM: 0.2011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6918, partial_loss/deprel_loss: 2.1989, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3648, loss: 1.2362, batch_reg_loss: 0.0673, reg_loss: 0.0665 ||:  86%|########6 | 96/111 [01:05<00:10,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8118, UAS: 0.8947, LAS: 0.8168, UEM: 0.4295, LEM: 0.1973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0917, partial_loss/deprel_loss: 1.1721, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2234, loss: 1.2352, batch_reg_loss: 0.0674, reg_loss: 0.0665 ||:  89%|########9 | 99/111 [01:07<00:08,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8250, UAS: 0.8951, LAS: 0.8172, UEM: 0.4260, LEM: 0.1936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9414, partial_loss/deprel_loss: 1.0274, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0777, loss: 1.2291, batch_reg_loss: 0.0675, reg_loss: 0.0665 ||:  93%|#########2| 103/111 [01:10<00:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8082, UAS: 0.8962, LAS: 0.8186, UEM: 0.4419, LEM: 0.2084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1479, partial_loss/deprel_loss: 1.1772, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2388, loss: 1.2158, batch_reg_loss: 0.0675, reg_loss: 0.0666 ||:  95%|#########5| 106/111 [01:12<00:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8127, UAS: 0.8962, LAS: 0.8185, UEM: 0.4424, LEM: 0.2096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9760, partial_loss/deprel_loss: 1.2365, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2520, loss: 1.2173, batch_reg_loss: 0.0676, reg_loss: 0.0666 ||:  99%|#########9| 110/111 [01:14<00:00,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7871, UAS: 0.8960, LAS: 0.8182, UEM: 0.4402, LEM: 0.2085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3663, partial_loss/deprel_loss: 1.4187, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4759, loss: 1.2197, batch_reg_loss: 0.0676, reg_loss: 0.0666 ||: 100%|##########| 111/111 [01:15<00:00,  1.48it/s]\n",
+      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.419  |       N/A\n",
+      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.366  |       N/A\n",
+      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.067  |       N/A\n",
+      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - UEM                      |     0.440  |       N/A\n",
+      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - LAS                      |     0.818  |       N/A\n",
+      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - loss                     |     1.220  |       N/A\n",
+      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - LEM                      |     0.209  |       N/A\n",
+      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - UAS                      |     0.896  |       N/A\n",
+      "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - EM                       |     0.787  |       N/A\n",
+      "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:03:06,511 - INFO - combo.training.trainer - Epoch duration: 0:01:15.152380\n",
+      "2023-04-06 23:03:06,512 - INFO - combo.training.trainer - Estimated training time remaining: 8:39:28\n",
+      "2023-04-06 23:03:06,512 - INFO - allennlp.training.trainer - Epoch 10/399\n",
+      "2023-04-06 23:03:06,512 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:03:06,512 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:03:06,518 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8555, UAS: 0.9211, LAS: 0.8489, UEM: 0.4350, LEM: 0.1673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6806, partial_loss/deprel_loss: 0.8446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8795, loss: 0.9582, batch_reg_loss: 0.0677, reg_loss: 0.0676 ||:   3%|2         | 3/111 [00:02<01:13,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7567, UAS: 0.9095, LAS: 0.8358, UEM: 0.3786, LEM: 0.1376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0075, partial_loss/deprel_loss: 1.6559, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7939, loss: 1.0705, batch_reg_loss: 0.0677, reg_loss: 0.0677 ||:   6%|6         | 7/111 [00:04<01:07,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9037, LAS: 0.8297, UEM: 0.4104, LEM: 0.1799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4051, partial_loss/deprel_loss: 0.6088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6359, loss: 1.1128, batch_reg_loss: 0.0678, reg_loss: 0.0677 ||:   9%|9         | 10/111 [00:06<01:06,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9057, LAS: 0.8309, UEM: 0.3985, LEM: 0.1653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1594, partial_loss/deprel_loss: 1.4341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4470, loss: 1.1057, batch_reg_loss: 0.0678, reg_loss: 0.0677 ||:  12%|#1        | 13/111 [00:08<01:07,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7768, UAS: 0.8954, LAS: 0.8210, UEM: 0.3798, LEM: 0.1587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8156, partial_loss/deprel_loss: 1.4734, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6097, loss: 1.1918, batch_reg_loss: 0.0679, reg_loss: 0.0678 ||:  14%|#4        | 16/111 [00:10<01:05,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9001, LAS: 0.8265, UEM: 0.3925, LEM: 0.1602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5088, partial_loss/deprel_loss: 0.6757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7103, loss: 1.1418, batch_reg_loss: 0.0680, reg_loss: 0.0678 ||:  18%|#8        | 20/111 [00:13<01:01,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9033, LAS: 0.8293, UEM: 0.4103, LEM: 0.1721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5729, partial_loss/deprel_loss: 0.8466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8599, loss: 1.1190, batch_reg_loss: 0.0680, reg_loss: 0.0678 ||:  21%|##        | 23/111 [00:15<00:59,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7607, UAS: 0.9003, LAS: 0.8257, UEM: 0.3788, LEM: 0.1528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9901, partial_loss/deprel_loss: 1.5372, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6959, loss: 1.1511, batch_reg_loss: 0.0681, reg_loss: 0.0679 ||:  25%|##5       | 28/111 [00:17<00:50,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8466, UAS: 0.9034, LAS: 0.8289, UEM: 0.3855, LEM: 0.1509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7388, partial_loss/deprel_loss: 1.0446, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0516, loss: 1.1226, batch_reg_loss: 0.0682, reg_loss: 0.0679 ||:  29%|##8       | 32/111 [00:20<00:51,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9063, LAS: 0.8325, UEM: 0.4192, LEM: 0.1846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3700, partial_loss/deprel_loss: 0.6140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6335, loss: 1.0953, batch_reg_loss: 0.0683, reg_loss: 0.0679 ||:  32%|###2      | 36/111 [00:23<00:52,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9079, LAS: 0.8343, UEM: 0.4254, LEM: 0.1857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4378, partial_loss/deprel_loss: 0.7192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7312, loss: 1.0799, batch_reg_loss: 0.0683, reg_loss: 0.0680 ||:  35%|###5      | 39/111 [00:25<00:50,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9090, LAS: 0.8357, UEM: 0.4734, LEM: 0.2418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5374, partial_loss/deprel_loss: 0.8689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8710, loss: 1.0719, batch_reg_loss: 0.0684, reg_loss: 0.0680 ||:  38%|###7      | 42/111 [00:28<00:52,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9110, LAS: 0.8381, UEM: 0.4946, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5987, partial_loss/deprel_loss: 0.8453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8644, loss: 1.0472, batch_reg_loss: 0.0684, reg_loss: 0.0680 ||:  41%|####      | 45/111 [00:31<00:51,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8491, UAS: 0.9084, LAS: 0.8351, UEM: 0.4845, LEM: 0.2480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6995, partial_loss/deprel_loss: 0.8959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9251, loss: 1.0728, batch_reg_loss: 0.0685, reg_loss: 0.0680 ||:  43%|####3     | 48/111 [00:33<00:48,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8088, UAS: 0.9075, LAS: 0.8338, UEM: 0.4736, LEM: 0.2393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1152, partial_loss/deprel_loss: 1.1692, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2269, loss: 1.0826, batch_reg_loss: 0.0685, reg_loss: 0.0681 ||:  46%|####5     | 51/111 [00:35<00:44,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7492, UAS: 0.9047, LAS: 0.8305, UEM: 0.4617, LEM: 0.2330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8205, partial_loss/deprel_loss: 1.8595, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9202, loss: 1.1140, batch_reg_loss: 0.0686, reg_loss: 0.0681 ||:  49%|####8     | 54/111 [00:37<00:41,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7964, UAS: 0.9034, LAS: 0.8291, UEM: 0.4487, LEM: 0.2257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2039, partial_loss/deprel_loss: 1.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3791, loss: 1.1273, batch_reg_loss: 0.0686, reg_loss: 0.0681 ||:  51%|#####1    | 57/111 [00:39<00:39,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7435, UAS: 0.9016, LAS: 0.8268, UEM: 0.4383, LEM: 0.2176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2836, partial_loss/deprel_loss: 1.8352, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9936, loss: 1.1479, batch_reg_loss: 0.0687, reg_loss: 0.0682 ||:  55%|#####4    | 61/111 [00:42<00:34,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8348, UAS: 0.9023, LAS: 0.8278, UEM: 0.4403, LEM: 0.2168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7759, partial_loss/deprel_loss: 1.0006, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0244, loss: 1.1379, batch_reg_loss: 0.0688, reg_loss: 0.0682 ||:  58%|#####7    | 64/111 [00:44<00:32,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.9030, LAS: 0.8286, UEM: 0.4388, LEM: 0.2130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5197, partial_loss/deprel_loss: 0.7770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7944, loss: 1.1308, batch_reg_loss: 0.0689, reg_loss: 0.0682 ||:  60%|######    | 67/111 [00:46<00:30,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9032, LAS: 0.8287, UEM: 0.4419, LEM: 0.2154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3263, partial_loss/deprel_loss: 0.6052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6184, loss: 1.1277, batch_reg_loss: 0.0689, reg_loss: 0.0683 ||:  63%|######3   | 70/111 [00:48<00:29,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8555, UAS: 0.9024, LAS: 0.8277, UEM: 0.4353, LEM: 0.2113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6941, partial_loss/deprel_loss: 0.8625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8978, loss: 1.1377, batch_reg_loss: 0.0690, reg_loss: 0.0683 ||:  66%|######5   | 73/111 [00:50<00:26,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7257, UAS: 0.9023, LAS: 0.8276, UEM: 0.4461, LEM: 0.2181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5688, partial_loss/deprel_loss: 1.8292, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0462, loss: 1.1387, batch_reg_loss: 0.0691, reg_loss: 0.0683 ||:  68%|######8   | 76/111 [00:52<00:24,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8725, UAS: 0.9029, LAS: 0.8282, UEM: 0.4496, LEM: 0.2185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4104, partial_loss/deprel_loss: 0.7276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7332, loss: 1.1344, batch_reg_loss: 0.0691, reg_loss: 0.0683 ||:  71%|#######1  | 79/111 [00:55<00:22,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7970, UAS: 0.9011, LAS: 0.8263, UEM: 0.4404, LEM: 0.2131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4546, partial_loss/deprel_loss: 1.2680, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3746, loss: 1.1528, batch_reg_loss: 0.0692, reg_loss: 0.0684 ||:  75%|#######4  | 83/111 [00:57<00:19,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7372, UAS: 0.9006, LAS: 0.8256, UEM: 0.4416, LEM: 0.2148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9790, partial_loss/deprel_loss: 1.8560, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9498, loss: 1.1586, batch_reg_loss: 0.0693, reg_loss: 0.0684 ||:  77%|#######7  | 86/111 [00:59<00:17,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.9005, LAS: 0.8255, UEM: 0.4447, LEM: 0.2144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4351, partial_loss/deprel_loss: 0.7105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7247, loss: 1.1604, batch_reg_loss: 0.0694, reg_loss: 0.0685 ||:  81%|########1 | 90/111 [01:02<00:14,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9016, LAS: 0.8266, UEM: 0.4473, LEM: 0.2139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4284, partial_loss/deprel_loss: 0.6718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6926, loss: 1.1503, batch_reg_loss: 0.0694, reg_loss: 0.0685 ||:  84%|########3 | 93/111 [01:04<00:12,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8070, UAS: 0.9025, LAS: 0.8278, UEM: 0.4611, LEM: 0.2269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3530, partial_loss/deprel_loss: 1.2532, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3427, loss: 1.1401, batch_reg_loss: 0.0695, reg_loss: 0.0685 ||:  86%|########6 | 96/111 [01:06<00:10,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9011, LAS: 0.8262, UEM: 0.4614, LEM: 0.2285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3227, partial_loss/deprel_loss: 0.5647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5858, loss: 1.1574, batch_reg_loss: 0.0696, reg_loss: 0.0686 ||:  90%|######### | 100/111 [01:08<00:07,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7670, UAS: 0.9000, LAS: 0.8250, UEM: 0.4556, LEM: 0.2241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6908, partial_loss/deprel_loss: 1.5468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6452, loss: 1.1669, batch_reg_loss: 0.0696, reg_loss: 0.0686 ||:  94%|#########3| 104/111 [01:11<00:04,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.8997, LAS: 0.8246, UEM: 0.4485, LEM: 0.2188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9835, partial_loss/deprel_loss: 1.0113, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0754, loss: 1.1688, batch_reg_loss: 0.0697, reg_loss: 0.0686 ||:  97%|#########7| 108/111 [01:13<00:01,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.8993, LAS: 0.8241, UEM: 0.4477, LEM: 0.2181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3591, partial_loss/deprel_loss: 0.6441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6569, loss: 1.1728, batch_reg_loss: 0.0698, reg_loss: 0.0687 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-06 23:04:21,844 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9091, LAS: 0.8425, UEM: 0.5537, LEM: 0.2550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4429, partial_loss/deprel_loss: 25.5584, partial_loss/cycle_loss: 0.0000, batch_loss: 20.5353, loss: 33.4054, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:12,  1.17s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9252, LAS: 0.8642, UEM: 0.6450, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2464, partial_loss/deprel_loss: 19.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9139, loss: 26.8195, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:05<00:08,  1.10s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8695, UAS: 0.9317, LAS: 0.8693, UEM: 0.6302, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5259, partial_loss/deprel_loss: 23.7138, partial_loss/cycle_loss: 0.0000, batch_loss: 19.0762, loss: 25.0754, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:08<00:05,  1.06s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8426, UAS: 0.9354, LAS: 0.8720, UEM: 0.6148, LEM: 0.3476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0366, partial_loss/deprel_loss: 42.6409, partial_loss/cycle_loss: 0.0000, batch_loss: 34.3200, loss: 24.3461, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:02,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9327, LAS: 0.8688, UEM: 0.5809, LEM: 0.3203, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1886, partial_loss/deprel_loss: 48.1446, partial_loss/cycle_loss: 0.0000, batch_loss: 38.7534, loss: 25.3898, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
+      "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.644  |    48.145\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.359  |     1.189\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.069  |     0.000\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - UEM                      |     0.448  |     0.581\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - LAS                      |     0.824  |     0.869\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - loss                     |     1.173  |    25.390\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - LEM                      |     0.218  |     0.320\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - UAS                      |     0.899  |     0.933\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - EM                       |     0.879  |     0.844\n",
+      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:04:34,523 - INFO - combo.training.trainer - Epoch duration: 0:01:28.011201\n",
+      "2023-04-06 23:04:34,523 - INFO - combo.training.trainer - Estimated training time remaining: 8:42:55\n",
+      "2023-04-06 23:04:34,523 - INFO - allennlp.training.trainer - Epoch 11/399\n",
+      "2023-04-06 23:04:34,523 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:04:34,523 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:04:34,529 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7318, UAS: 0.9023, LAS: 0.8266, UEM: 0.6184, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2381, partial_loss/deprel_loss: 1.8576, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0035, loss: 1.1306, batch_reg_loss: 0.0699, reg_loss: 0.0698 ||:   3%|2         | 3/111 [00:02<01:23,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8728, UAS: 0.9063, LAS: 0.8290, UEM: 0.4976, LEM: 0.2240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4630, partial_loss/deprel_loss: 0.8076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8086, loss: 1.1307, batch_reg_loss: 0.0699, reg_loss: 0.0699 ||:   5%|5         | 6/111 [00:04<01:18,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9103, LAS: 0.8362, UEM: 0.4687, LEM: 0.1954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1053, partial_loss/deprel_loss: 1.2357, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2797, loss: 1.0641, batch_reg_loss: 0.0700, reg_loss: 0.0699 ||:   9%|9         | 10/111 [00:06<01:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7896, UAS: 0.9057, LAS: 0.8323, UEM: 0.4223, LEM: 0.1711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5511, partial_loss/deprel_loss: 1.3968, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4978, loss: 1.0987, batch_reg_loss: 0.0701, reg_loss: 0.0700 ||:  12%|#1        | 13/111 [00:08<01:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7038, UAS: 0.8933, LAS: 0.8198, UEM: 0.4015, LEM: 0.1612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.3903, partial_loss/deprel_loss: 2.1584, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4749, loss: 1.2235, batch_reg_loss: 0.0702, reg_loss: 0.0700 ||:  15%|#5        | 17/111 [00:11<01:05,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.8926, LAS: 0.8186, UEM: 0.3850, LEM: 0.1549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5808, partial_loss/deprel_loss: 0.8367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8557, loss: 1.2307, batch_reg_loss: 0.0702, reg_loss: 0.0700 ||:  18%|#8        | 20/111 [00:13<01:04,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.8979, LAS: 0.8248, UEM: 0.4068, LEM: 0.1651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4397, partial_loss/deprel_loss: 0.6836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7051, loss: 1.1735, batch_reg_loss: 0.0703, reg_loss: 0.0701 ||:  21%|##        | 23/111 [00:16<01:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8470, UAS: 0.9013, LAS: 0.8287, UEM: 0.4106, LEM: 0.1665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6933, partial_loss/deprel_loss: 0.9933, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0037, loss: 1.1421, batch_reg_loss: 0.0704, reg_loss: 0.0701 ||:  24%|##4       | 27/111 [00:18<00:56,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9032, LAS: 0.8303, UEM: 0.4190, LEM: 0.1744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3419, partial_loss/deprel_loss: 0.5709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5955, loss: 1.1172, batch_reg_loss: 0.0705, reg_loss: 0.0701 ||:  28%|##7       | 31/111 [00:21<00:54,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9035, LAS: 0.8302, UEM: 0.4089, LEM: 0.1680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6362, partial_loss/deprel_loss: 0.7944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8333, loss: 1.1133, batch_reg_loss: 0.0705, reg_loss: 0.0702 ||:  31%|###       | 34/111 [00:23<00:52,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9044, LAS: 0.8316, UEM: 0.4279, LEM: 0.1793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3551, partial_loss/deprel_loss: 0.6374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6515, loss: 1.1019, batch_reg_loss: 0.0706, reg_loss: 0.0702 ||:  34%|###4      | 38/111 [00:25<00:47,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8177, UAS: 0.9025, LAS: 0.8289, UEM: 0.4126, LEM: 0.1706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0452, partial_loss/deprel_loss: 1.1970, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2373, loss: 1.1266, batch_reg_loss: 0.0707, reg_loss: 0.0703 ||:  38%|###7      | 42/111 [00:28<00:44,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8176, UAS: 0.9022, LAS: 0.8284, UEM: 0.3981, LEM: 0.1621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1751, partial_loss/deprel_loss: 1.1391, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2171, loss: 1.1310, batch_reg_loss: 0.0708, reg_loss: 0.0703 ||:  41%|####1     | 46/111 [00:30<00:40,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9036, LAS: 0.8304, UEM: 0.4308, LEM: 0.1934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6100, partial_loss/deprel_loss: 0.8959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9096, loss: 1.1156, batch_reg_loss: 0.0709, reg_loss: 0.0703 ||:  45%|####5     | 50/111 [00:33<00:40,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7861, UAS: 0.8996, LAS: 0.8257, UEM: 0.4162, LEM: 0.1863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4086, partial_loss/deprel_loss: 1.4620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5223, loss: 1.1565, batch_reg_loss: 0.0709, reg_loss: 0.0704 ||:  49%|####8     | 54/111 [00:36<00:38,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8806, UAS: 0.9003, LAS: 0.8264, UEM: 0.4200, LEM: 0.1901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4031, partial_loss/deprel_loss: 0.6066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6369, loss: 1.1513, batch_reg_loss: 0.0710, reg_loss: 0.0704 ||:  51%|#####1    | 57/111 [00:39<00:40,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8030, UAS: 0.8989, LAS: 0.8248, UEM: 0.4080, LEM: 0.1835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4330, partial_loss/deprel_loss: 1.2713, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3747, loss: 1.1698, batch_reg_loss: 0.0711, reg_loss: 0.0705 ||:  55%|#####4    | 61/111 [00:41<00:35,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.8991, LAS: 0.8250, UEM: 0.4074, LEM: 0.1823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3995, partial_loss/deprel_loss: 0.6930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7055, loss: 1.1708, batch_reg_loss: 0.0712, reg_loss: 0.0705 ||:  58%|#####7    | 64/111 [00:43<00:32,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9010, LAS: 0.8273, UEM: 0.4541, LEM: 0.2326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2275, partial_loss/deprel_loss: 0.4708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4934, loss: 1.1522, batch_reg_loss: 0.0713, reg_loss: 0.0705 ||:  60%|######    | 67/111 [00:46<00:33,  1.30it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9019, LAS: 0.8284, UEM: 0.4523, LEM: 0.2285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5616, partial_loss/deprel_loss: 0.7684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7984, loss: 1.1425, batch_reg_loss: 0.0713, reg_loss: 0.0706 ||:  63%|######3   | 70/111 [00:48<00:30,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8597, UAS: 0.9028, LAS: 0.8292, UEM: 0.4489, LEM: 0.2223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5849, partial_loss/deprel_loss: 0.8075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8344, loss: 1.1331, batch_reg_loss: 0.0714, reg_loss: 0.0706 ||:  67%|######6   | 74/111 [00:51<00:27,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8455, UAS: 0.9026, LAS: 0.8289, UEM: 0.4483, LEM: 0.2209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7892, partial_loss/deprel_loss: 0.9486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9882, loss: 1.1360, batch_reg_loss: 0.0715, reg_loss: 0.0706 ||:  69%|######9   | 77/111 [00:53<00:24,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7855, UAS: 0.9023, LAS: 0.8285, UEM: 0.4494, LEM: 0.2224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5825, partial_loss/deprel_loss: 1.4556, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5525, loss: 1.1386, batch_reg_loss: 0.0716, reg_loss: 0.0707 ||:  72%|#######2  | 80/111 [00:55<00:21,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7285, UAS: 0.9020, LAS: 0.8283, UEM: 0.4558, LEM: 0.2254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6126, partial_loss/deprel_loss: 1.8106, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0426, loss: 1.1390, batch_reg_loss: 0.0716, reg_loss: 0.0707 ||:  75%|#######4  | 83/111 [00:57<00:21,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9022, LAS: 0.8285, UEM: 0.4532, LEM: 0.2213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4983, partial_loss/deprel_loss: 0.8175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8254, loss: 1.1382, batch_reg_loss: 0.0717, reg_loss: 0.0707 ||:  78%|#######8  | 87/111 [01:00<00:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9024, LAS: 0.8289, UEM: 0.4612, LEM: 0.2287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4406, partial_loss/deprel_loss: 0.6748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6998, loss: 1.1361, batch_reg_loss: 0.0718, reg_loss: 0.0708 ||:  82%|########1 | 91/111 [01:03<00:14,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7991, UAS: 0.9021, LAS: 0.8285, UEM: 0.4575, LEM: 0.2255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4676, partial_loss/deprel_loss: 1.4466, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5226, loss: 1.1405, batch_reg_loss: 0.0719, reg_loss: 0.0708 ||:  86%|########5 | 95/111 [01:05<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7878, UAS: 0.9016, LAS: 0.8278, UEM: 0.4487, LEM: 0.2202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5254, partial_loss/deprel_loss: 1.4661, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5499, loss: 1.1483, batch_reg_loss: 0.0720, reg_loss: 0.0709 ||:  89%|########9 | 99/111 [01:08<00:08,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8066, UAS: 0.9015, LAS: 0.8276, UEM: 0.4439, LEM: 0.2164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1248, partial_loss/deprel_loss: 1.2021, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2587, loss: 1.1491, batch_reg_loss: 0.0720, reg_loss: 0.0709 ||:  93%|#########2| 103/111 [01:10<00:05,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8412, UAS: 0.9024, LAS: 0.8286, UEM: 0.4471, LEM: 0.2176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7510, partial_loss/deprel_loss: 0.9877, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0125, loss: 1.1405, batch_reg_loss: 0.0721, reg_loss: 0.0710 ||:  96%|#########6| 107/111 [01:12<00:02,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7498, UAS: 0.9025, LAS: 0.8286, UEM: 0.4506, LEM: 0.2200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1198, partial_loss/deprel_loss: 1.8436, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9710, loss: 1.1415, batch_reg_loss: 0.0722, reg_loss: 0.0710 ||: 100%|##########| 111/111 [01:15<00:00,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7498, UAS: 0.9025, LAS: 0.8286, UEM: 0.4506, LEM: 0.2200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1198, partial_loss/deprel_loss: 1.8436, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9710, loss: 1.1415, batch_reg_loss: 0.0722, reg_loss: 0.0710 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.844  |       N/A\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     2.120  |       N/A\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.071  |       N/A\n",
+      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - UEM                      |     0.451  |       N/A\n",
+      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - LAS                      |     0.829  |       N/A\n",
+      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - loss                     |     1.141  |       N/A\n",
+      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - LEM                      |     0.220  |       N/A\n",
+      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - UAS                      |     0.902  |       N/A\n",
+      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - EM                       |     0.750  |       N/A\n",
+      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:05:50,106 - INFO - combo.training.trainer - Epoch duration: 0:01:15.582589\n",
+      "2023-04-06 23:05:50,106 - INFO - combo.training.trainer - Estimated training time remaining: 8:38:50\n",
+      "2023-04-06 23:05:50,106 - INFO - allennlp.training.trainer - Epoch 12/399\n",
+      "2023-04-06 23:05:50,106 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:05:50,106 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:05:50,112 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9145, LAS: 0.8453, UEM: 0.4518, LEM: 0.2105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4663, partial_loss/deprel_loss: 0.7585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7723, loss: 1.0488, batch_reg_loss: 0.0723, reg_loss: 0.0723 ||:   3%|2         | 3/111 [00:02<01:15,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9059, LAS: 0.8377, UEM: 0.5846, LEM: 0.3476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6475, partial_loss/deprel_loss: 0.8195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8574, loss: 1.0996, batch_reg_loss: 0.0723, reg_loss: 0.0723 ||:   5%|5         | 6/111 [00:04<01:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9139, LAS: 0.8456, UEM: 0.5705, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4356, partial_loss/deprel_loss: 0.6474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6774, loss: 1.0076, batch_reg_loss: 0.0724, reg_loss: 0.0723 ||:   8%|8         | 9/111 [00:06<01:13,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9174, LAS: 0.8482, UEM: 0.5739, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3122, partial_loss/deprel_loss: 0.6180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6293, loss: 0.9715, batch_reg_loss: 0.0725, reg_loss: 0.0723 ||:  11%|#         | 12/111 [00:08<01:13,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8221, UAS: 0.9104, LAS: 0.8398, UEM: 0.5355, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0309, partial_loss/deprel_loss: 1.0752, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1389, loss: 1.0415, batch_reg_loss: 0.0725, reg_loss: 0.0724 ||:  14%|#3        | 15/111 [00:11<01:11,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8429, UAS: 0.9067, LAS: 0.8371, UEM: 0.5688, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8351, partial_loss/deprel_loss: 0.9804, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0239, loss: 1.0859, batch_reg_loss: 0.0726, reg_loss: 0.0724 ||:  16%|#6        | 18/111 [00:13<01:10,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9099, LAS: 0.8394, UEM: 0.5595, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5296, partial_loss/deprel_loss: 0.7868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8080, loss: 1.0573, batch_reg_loss: 0.0726, reg_loss: 0.0724 ||:  19%|#8        | 21/111 [00:15<01:05,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8695, UAS: 0.9070, LAS: 0.8361, UEM: 0.5278, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5860, partial_loss/deprel_loss: 0.8350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8579, loss: 1.0872, batch_reg_loss: 0.0727, reg_loss: 0.0725 ||:  23%|##2       | 25/111 [00:17<00:59,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9108, LAS: 0.8402, UEM: 0.5494, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7324, partial_loss/deprel_loss: 0.9558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9839, loss: 1.0478, batch_reg_loss: 0.0728, reg_loss: 0.0725 ||:  25%|##5       | 28/111 [00:20<00:58,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8217, UAS: 0.9095, LAS: 0.8378, UEM: 0.5353, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9042, partial_loss/deprel_loss: 1.1620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1834, loss: 1.0668, batch_reg_loss: 0.0729, reg_loss: 0.0726 ||:  29%|##8       | 32/111 [00:22<00:53,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8655, UAS: 0.9101, LAS: 0.8382, UEM: 0.5166, LEM: 0.2622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5087, partial_loss/deprel_loss: 0.8009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8154, loss: 1.0627, batch_reg_loss: 0.0730, reg_loss: 0.0726 ||:  32%|###2      | 36/111 [00:25<00:49,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8028, UAS: 0.9089, LAS: 0.8370, UEM: 0.5070, LEM: 0.2578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3822, partial_loss/deprel_loss: 1.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4248, loss: 1.0717, batch_reg_loss: 0.0731, reg_loss: 0.0726 ||:  36%|###6      | 40/111 [00:27<00:46,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9101, LAS: 0.8384, UEM: 0.5297, LEM: 0.2952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0845, partial_loss/deprel_loss: 0.2260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2709, loss: 1.0596, batch_reg_loss: 0.0731, reg_loss: 0.0727 ||:  40%|###9      | 44/111 [00:30<00:47,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9088, LAS: 0.8368, UEM: 0.5236, LEM: 0.2921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3538, partial_loss/deprel_loss: 0.5469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5815, loss: 1.0727, batch_reg_loss: 0.0732, reg_loss: 0.0727 ||:  43%|####3     | 48/111 [00:33<00:44,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8150, UAS: 0.9072, LAS: 0.8350, UEM: 0.5092, LEM: 0.2833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0867, partial_loss/deprel_loss: 1.3690, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3859, loss: 1.0896, batch_reg_loss: 0.0733, reg_loss: 0.0728 ||:  46%|####5     | 51/111 [00:36<00:43,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.9088, LAS: 0.8370, UEM: 0.5143, LEM: 0.2817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8776, partial_loss/deprel_loss: 1.0180, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0633, loss: 1.0735, batch_reg_loss: 0.0734, reg_loss: 0.0728 ||:  49%|####8     | 54/111 [00:38<00:43,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7273, UAS: 0.9077, LAS: 0.8359, UEM: 0.5105, LEM: 0.2755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6504, partial_loss/deprel_loss: 1.8004, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0438, loss: 1.0829, batch_reg_loss: 0.0734, reg_loss: 0.0728 ||:  51%|#####1    | 57/111 [00:40<00:39,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7544, UAS: 0.9065, LAS: 0.8341, UEM: 0.4990, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8573, partial_loss/deprel_loss: 1.7411, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8378, loss: 1.0979, batch_reg_loss: 0.0735, reg_loss: 0.0729 ||:  54%|#####4    | 60/111 [00:42<00:37,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7376, UAS: 0.9049, LAS: 0.8321, UEM: 0.4968, LEM: 0.2647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1506, partial_loss/deprel_loss: 1.7339, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8908, loss: 1.1161, batch_reg_loss: 0.0736, reg_loss: 0.0729 ||:  57%|#####6    | 63/111 [00:45<00:35,  1.34it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7635, UAS: 0.9050, LAS: 0.8323, UEM: 0.4953, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9722, partial_loss/deprel_loss: 1.6385, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7789, loss: 1.1152, batch_reg_loss: 0.0737, reg_loss: 0.0729 ||:  60%|######    | 67/111 [00:47<00:31,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9055, LAS: 0.8327, UEM: 0.4957, LEM: 0.2607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.5606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5937, loss: 1.1123, batch_reg_loss: 0.0737, reg_loss: 0.0730 ||:  63%|######3   | 70/111 [00:50<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9058, LAS: 0.8332, UEM: 0.4880, LEM: 0.2547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6342, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8317, loss: 1.1077, batch_reg_loss: 0.0738, reg_loss: 0.0730 ||:  67%|######6   | 74/111 [00:52<00:26,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9068, LAS: 0.8343, UEM: 0.4830, LEM: 0.2481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7012, partial_loss/deprel_loss: 0.8971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9318, loss: 1.0977, batch_reg_loss: 0.0739, reg_loss: 0.0731 ||:  70%|#######   | 78/111 [00:54<00:21,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9070, LAS: 0.8342, UEM: 0.4768, LEM: 0.2413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7163, partial_loss/deprel_loss: 0.9517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9786, loss: 1.0981, batch_reg_loss: 0.0740, reg_loss: 0.0731 ||:  74%|#######3  | 82/111 [00:57<00:19,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7462, UAS: 0.9056, LAS: 0.8328, UEM: 0.4687, LEM: 0.2366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1859, partial_loss/deprel_loss: 1.6293, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8147, loss: 1.1102, batch_reg_loss: 0.0741, reg_loss: 0.0731 ||:  77%|#######7  | 86/111 [00:59<00:15,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8527, UAS: 0.9051, LAS: 0.8322, UEM: 0.4610, LEM: 0.2306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6899, partial_loss/deprel_loss: 0.8140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8633, loss: 1.1154, batch_reg_loss: 0.0742, reg_loss: 0.0732 ||:  81%|########1 | 90/111 [01:02<00:13,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9056, LAS: 0.8328, UEM: 0.4617, LEM: 0.2292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3437, partial_loss/deprel_loss: 0.5813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6080, loss: 1.1113, batch_reg_loss: 0.0743, reg_loss: 0.0732 ||:  85%|########4 | 94/111 [01:04<00:10,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8285, UAS: 0.9058, LAS: 0.8330, UEM: 0.4594, LEM: 0.2272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8808, partial_loss/deprel_loss: 1.0929, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1248, loss: 1.1101, batch_reg_loss: 0.0743, reg_loss: 0.0733 ||:  88%|########8 | 98/111 [01:07<00:08,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9059, LAS: 0.8333, UEM: 0.4644, LEM: 0.2317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5260, partial_loss/deprel_loss: 0.6404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6920, loss: 1.1069, batch_reg_loss: 0.0744, reg_loss: 0.0733 ||:  92%|#########1| 102/111 [01:09<00:05,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9051, LAS: 0.8326, UEM: 0.4572, LEM: 0.2272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7691, partial_loss/deprel_loss: 0.9381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9788, loss: 1.1119, batch_reg_loss: 0.0745, reg_loss: 0.0734 ||:  95%|#########5| 106/111 [01:12<00:03,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8197, UAS: 0.9062, LAS: 0.8339, UEM: 0.4675, LEM: 0.2349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0885, partial_loss/deprel_loss: 1.1797, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2361, loss: 1.0998, batch_reg_loss: 0.0746, reg_loss: 0.0734 ||:  99%|#########9| 110/111 [01:15<00:00,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8198, UAS: 0.9061, LAS: 0.8338, UEM: 0.4655, LEM: 0.2335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0232, partial_loss/deprel_loss: 1.1102, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1674, loss: 1.1004, batch_reg_loss: 0.0746, reg_loss: 0.0734 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-06 23:07:05,881 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.110  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.023  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.073  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - UEM                      |     0.465  |       N/A\n",
+      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - LAS                      |     0.834  |       N/A\n",
+      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - loss                     |     1.100  |       N/A\n",
+      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - LEM                      |     0.233  |       N/A\n",
+      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - UAS                      |     0.906  |       N/A\n",
+      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - EM                       |     0.820  |       N/A\n",
+      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:07:05,884 - INFO - combo.training.trainer - Epoch duration: 0:01:15.777801\n",
+      "2023-04-06 23:07:05,884 - INFO - combo.training.trainer - Estimated training time remaining: 8:35:17\n",
+      "2023-04-06 23:07:05,884 - INFO - allennlp.training.trainer - Epoch 13/399\n",
+      "2023-04-06 23:07:05,884 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:07:05,884 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:07:05,891 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9303, LAS: 0.8619, UEM: 0.4574, LEM: 0.1618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7100, partial_loss/deprel_loss: 0.9025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9387, loss: 0.8542, batch_reg_loss: 0.0747, reg_loss: 0.0747 ||:   4%|3         | 4/111 [00:02<01:05,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9274, LAS: 0.8577, UEM: 0.5495, LEM: 0.2515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5867, partial_loss/deprel_loss: 0.8378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8624, loss: 0.9059, batch_reg_loss: 0.0747, reg_loss: 0.0747 ||:   6%|6         | 7/111 [00:04<01:06,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8469, UAS: 0.9324, LAS: 0.8661, UEM: 0.6490, LEM: 0.3987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7952, partial_loss/deprel_loss: 0.9270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9754, loss: 0.8396, batch_reg_loss: 0.0748, reg_loss: 0.0747 ||:   9%|9         | 10/111 [00:07<01:10,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8533, UAS: 0.9237, LAS: 0.8552, UEM: 0.6107, LEM: 0.3598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5861, partial_loss/deprel_loss: 0.8717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8895, loss: 0.9147, batch_reg_loss: 0.0749, reg_loss: 0.0748 ||:  12%|#1        | 13/111 [00:09<01:09,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9197, LAS: 0.8506, UEM: 0.5745, LEM: 0.3269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3641, partial_loss/deprel_loss: 0.6230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6461, loss: 0.9695, batch_reg_loss: 0.0749, reg_loss: 0.0748 ||:  15%|#5        | 17/111 [00:11<01:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9151, LAS: 0.8442, UEM: 0.5264, LEM: 0.2925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1686, partial_loss/deprel_loss: 1.2195, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2844, loss: 1.0252, batch_reg_loss: 0.0750, reg_loss: 0.0748 ||:  19%|#8        | 21/111 [00:13<00:57,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8267, UAS: 0.9124, LAS: 0.8413, UEM: 0.4941, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0154, partial_loss/deprel_loss: 1.0660, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1310, loss: 1.0460, batch_reg_loss: 0.0751, reg_loss: 0.0749 ||:  23%|##2       | 25/111 [00:16<00:53,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8238, UAS: 0.9086, LAS: 0.8368, UEM: 0.4664, LEM: 0.2499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0240, partial_loss/deprel_loss: 1.2609, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2887, loss: 1.0848, batch_reg_loss: 0.0752, reg_loss: 0.0749 ||:  26%|##6       | 29/111 [00:18<00:49,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9055, LAS: 0.8337, UEM: 0.4621, LEM: 0.2417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.6399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6710, loss: 1.1165, batch_reg_loss: 0.0753, reg_loss: 0.0749 ||:  30%|##9       | 33/111 [00:21<00:49,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9073, LAS: 0.8363, UEM: 0.4795, LEM: 0.2514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6131, partial_loss/deprel_loss: 0.7515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7992, loss: 1.0915, batch_reg_loss: 0.0754, reg_loss: 0.0750 ||:  33%|###3      | 37/111 [00:24<00:49,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7761, UAS: 0.9057, LAS: 0.8346, UEM: 0.4668, LEM: 0.2435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8575, partial_loss/deprel_loss: 1.3668, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5404, loss: 1.1023, batch_reg_loss: 0.0754, reg_loss: 0.0750 ||:  36%|###6      | 40/111 [00:26<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7881, UAS: 0.9043, LAS: 0.8329, UEM: 0.4531, LEM: 0.2340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5114, partial_loss/deprel_loss: 1.4052, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5020, loss: 1.1203, batch_reg_loss: 0.0755, reg_loss: 0.0751 ||:  40%|###9      | 44/111 [00:29<00:45,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9052, LAS: 0.8341, UEM: 0.4580, LEM: 0.2377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9760, partial_loss/deprel_loss: 0.9807, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0554, loss: 1.1106, batch_reg_loss: 0.0756, reg_loss: 0.0751 ||:  43%|####3     | 48/111 [00:31<00:41,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9044, LAS: 0.8330, UEM: 0.4435, LEM: 0.2266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8102, partial_loss/deprel_loss: 0.9511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9986, loss: 1.1189, batch_reg_loss: 0.0757, reg_loss: 0.0752 ||:  47%|####6     | 52/111 [00:34<00:38,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8000, UAS: 0.9029, LAS: 0.8312, UEM: 0.4362, LEM: 0.2202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5169, partial_loss/deprel_loss: 1.3667, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4725, loss: 1.1357, batch_reg_loss: 0.0758, reg_loss: 0.0752 ||:  50%|#####     | 56/111 [00:36<00:36,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7002, UAS: 0.9022, LAS: 0.8304, UEM: 0.4436, LEM: 0.2236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2238, partial_loss/deprel_loss: 2.1219, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4182, loss: 1.1438, batch_reg_loss: 0.0759, reg_loss: 0.0752 ||:  54%|#####4    | 60/111 [00:39<00:33,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9040, LAS: 0.8323, UEM: 0.4516, LEM: 0.2267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6981, partial_loss/deprel_loss: 0.9456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9721, loss: 1.1264, batch_reg_loss: 0.0760, reg_loss: 0.0753 ||:  58%|#####7    | 64/111 [00:41<00:30,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9055, LAS: 0.8341, UEM: 0.4556, LEM: 0.2268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4415, partial_loss/deprel_loss: 0.7414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 1.1101, batch_reg_loss: 0.0761, reg_loss: 0.0753 ||:  61%|######1   | 68/111 [00:44<00:28,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9040, LAS: 0.8328, UEM: 0.4447, LEM: 0.2207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7093, partial_loss/deprel_loss: 0.7485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8168, loss: 1.1185, batch_reg_loss: 0.0762, reg_loss: 0.0754 ||:  65%|######4   | 72/111 [00:47<00:25,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8172, UAS: 0.9043, LAS: 0.8333, UEM: 0.4447, LEM: 0.2198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2306, partial_loss/deprel_loss: 1.1250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2224, loss: 1.1130, batch_reg_loss: 0.0763, reg_loss: 0.0754 ||:  68%|######8   | 76/111 [00:50<00:24,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9062, LAS: 0.8355, UEM: 0.4584, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2390, partial_loss/deprel_loss: 0.4781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5066, loss: 1.0937, batch_reg_loss: 0.0764, reg_loss: 0.0755 ||:  72%|#######2  | 80/111 [00:53<00:21,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8032, UAS: 0.9060, LAS: 0.8351, UEM: 0.4538, LEM: 0.2249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3960, partial_loss/deprel_loss: 1.3687, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4506, loss: 1.0980, batch_reg_loss: 0.0764, reg_loss: 0.0755 ||:  75%|#######4  | 83/111 [00:55<00:19,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8021, UAS: 0.9050, LAS: 0.8337, UEM: 0.4466, LEM: 0.2208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3930, partial_loss/deprel_loss: 1.3680, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4495, loss: 1.1114, batch_reg_loss: 0.0765, reg_loss: 0.0755 ||:  77%|#######7  | 86/111 [00:57<00:17,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9049, LAS: 0.8336, UEM: 0.4501, LEM: 0.2231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3639, partial_loss/deprel_loss: 0.5709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6060, loss: 1.1125, batch_reg_loss: 0.0765, reg_loss: 0.0756 ||:  80%|########  | 89/111 [00:59<00:15,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9055, LAS: 0.8343, UEM: 0.4625, LEM: 0.2369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4388, partial_loss/deprel_loss: 0.6558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6890, loss: 1.1064, batch_reg_loss: 0.0766, reg_loss: 0.0756 ||:  84%|########3 | 93/111 [01:02<00:12,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8150, UAS: 0.9057, LAS: 0.8346, UEM: 0.4606, LEM: 0.2346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0815, partial_loss/deprel_loss: 1.1541, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2163, loss: 1.1032, batch_reg_loss: 0.0767, reg_loss: 0.0757 ||:  87%|########7 | 97/111 [01:04<00:09,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9064, LAS: 0.8353, UEM: 0.4631, LEM: 0.2353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5644, partial_loss/deprel_loss: 0.7545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7933, loss: 1.0944, batch_reg_loss: 0.0768, reg_loss: 0.0757 ||:  90%|######### | 100/111 [01:07<00:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9071, LAS: 0.8359, UEM: 0.4619, LEM: 0.2309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4491, partial_loss/deprel_loss: 0.7446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7624, loss: 1.0887, batch_reg_loss: 0.0769, reg_loss: 0.0757 ||:  94%|#########3| 104/111 [01:09<00:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8485, UAS: 0.9075, LAS: 0.8365, UEM: 0.4599, LEM: 0.2282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7765, partial_loss/deprel_loss: 0.9821, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0180, loss: 1.0846, batch_reg_loss: 0.0770, reg_loss: 0.0758 ||:  97%|#########7| 108/111 [01:12<00:01,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9079, LAS: 0.8370, UEM: 0.4689, LEM: 0.2362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5006, partial_loss/deprel_loss: 0.6604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7055, loss: 1.0791, batch_reg_loss: 0.0770, reg_loss: 0.0758 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
+      "2023-04-06 23:08:20,319 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:08:20,319 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.660  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.501  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.076  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - UEM                      |     0.469  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - LAS                      |     0.837  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - loss                     |     1.079  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - LEM                      |     0.236  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - UAS                      |     0.908  |       N/A\n",
+      "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - EM                       |     0.877  |       N/A\n",
+      "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:08:20,321 - INFO - combo.training.trainer - Epoch duration: 0:01:14.437484\n",
+      "2023-04-06 23:08:20,322 - INFO - combo.training.trainer - Estimated training time remaining: 8:31:27\n",
+      "2023-04-06 23:08:20,322 - INFO - allennlp.training.trainer - Epoch 14/399\n",
+      "2023-04-06 23:08:20,322 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:08:20,322 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:08:20,328 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9050, LAS: 0.8322, UEM: 0.3462, LEM: 0.1412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.6340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6619, loss: 1.1053, batch_reg_loss: 0.0771, reg_loss: 0.0771 ||:   4%|3         | 4/111 [00:02<01:09,  1.53it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9041, UAS: 0.9247, LAS: 0.8550, UEM: 0.5441, LEM: 0.2661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2521, partial_loss/deprel_loss: 0.4683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5022, loss: 0.9122, batch_reg_loss: 0.0772, reg_loss: 0.0771 ||:   6%|6         | 7/111 [00:04<01:09,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9159, LAS: 0.8477, UEM: 0.6024, LEM: 0.3563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8878, partial_loss/deprel_loss: 0.9722, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0326, loss: 0.9816, batch_reg_loss: 0.0773, reg_loss: 0.0772 ||:   9%|9         | 10/111 [00:06<01:09,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8393, UAS: 0.9164, LAS: 0.8477, UEM: 0.5390, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8523, partial_loss/deprel_loss: 0.9885, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0386, loss: 0.9758, batch_reg_loss: 0.0773, reg_loss: 0.0772 ||:  13%|#2        | 14/111 [00:09<01:03,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7601, UAS: 0.9110, LAS: 0.8412, UEM: 0.5185, LEM: 0.2800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9668, partial_loss/deprel_loss: 1.5166, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6841, loss: 1.0342, batch_reg_loss: 0.0774, reg_loss: 0.0772 ||:  15%|#5        | 17/111 [00:11<01:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8805, UAS: 0.9141, LAS: 0.8444, UEM: 0.5072, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3938, partial_loss/deprel_loss: 0.6296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 1.0093, batch_reg_loss: 0.0775, reg_loss: 0.0773 ||:  19%|#8        | 21/111 [00:14<01:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8259, UAS: 0.9116, LAS: 0.8416, UEM: 0.4865, LEM: 0.2501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0877, partial_loss/deprel_loss: 1.1095, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1827, loss: 1.0410, batch_reg_loss: 0.0776, reg_loss: 0.0773 ||:  23%|##2       | 25/111 [00:16<00:57,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8550, UAS: 0.9061, LAS: 0.8356, UEM: 0.4625, LEM: 0.2324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7059, partial_loss/deprel_loss: 0.8587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9058, loss: 1.0970, batch_reg_loss: 0.0777, reg_loss: 0.0774 ||:  26%|##6       | 29/111 [00:19<00:52,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9051, LAS: 0.8340, UEM: 0.4469, LEM: 0.2211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0395, partial_loss/deprel_loss: 1.0731, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1441, loss: 1.1120, batch_reg_loss: 0.0778, reg_loss: 0.0774 ||:  30%|##9       | 33/111 [00:21<00:50,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9085, LAS: 0.8382, UEM: 0.4764, LEM: 0.2406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3495, partial_loss/deprel_loss: 0.6205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6442, loss: 1.0744, batch_reg_loss: 0.0778, reg_loss: 0.0774 ||:  32%|###2      | 36/111 [00:24<00:52,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9108, LAS: 0.8411, UEM: 0.4902, LEM: 0.2499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6145, partial_loss/deprel_loss: 0.7804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8251, loss: 1.0500, batch_reg_loss: 0.0779, reg_loss: 0.0775 ||:  36%|###6      | 40/111 [00:26<00:48,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9124, LAS: 0.8426, UEM: 0.4984, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3140, partial_loss/deprel_loss: 0.5344, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5684, loss: 1.0315, batch_reg_loss: 0.0780, reg_loss: 0.0775 ||:  40%|###9      | 44/111 [00:29<00:45,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8373, UAS: 0.9119, LAS: 0.8419, UEM: 0.4840, LEM: 0.2437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9631, partial_loss/deprel_loss: 1.0249, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0907, loss: 1.0371, batch_reg_loss: 0.0781, reg_loss: 0.0776 ||:  42%|####2     | 47/111 [00:31<00:44,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9133, LAS: 0.8437, UEM: 0.4948, LEM: 0.2530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2245, partial_loss/deprel_loss: 0.4133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4537, loss: 1.0207, batch_reg_loss: 0.0782, reg_loss: 0.0776 ||:  46%|####5     | 51/111 [00:34<00:41,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7901, UAS: 0.9129, LAS: 0.8434, UEM: 0.4891, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6952, partial_loss/deprel_loss: 1.4274, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5592, loss: 1.0256, batch_reg_loss: 0.0782, reg_loss: 0.0776 ||:  49%|####8     | 54/111 [00:36<00:40,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9121, LAS: 0.8425, UEM: 0.4933, LEM: 0.2509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1891, partial_loss/deprel_loss: 0.4925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5101, loss: 1.0326, batch_reg_loss: 0.0783, reg_loss: 0.0777 ||:  52%|#####2    | 58/111 [00:39<00:37,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8539, UAS: 0.9113, LAS: 0.8415, UEM: 0.4846, LEM: 0.2433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6334, partial_loss/deprel_loss: 0.8711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9019, loss: 1.0366, batch_reg_loss: 0.0784, reg_loss: 0.0777 ||:  56%|#####5    | 62/111 [00:41<00:33,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9111, LAS: 0.8413, UEM: 0.4800, LEM: 0.2409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4166, partial_loss/deprel_loss: 0.6120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6514, loss: 1.0415, batch_reg_loss: 0.0785, reg_loss: 0.0778 ||:  59%|#####8    | 65/111 [00:44<00:31,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7980, UAS: 0.9108, LAS: 0.8410, UEM: 0.4735, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4804, partial_loss/deprel_loss: 1.3567, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4600, loss: 1.0455, batch_reg_loss: 0.0785, reg_loss: 0.0778 ||:  61%|######1   | 68/111 [00:46<00:30,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7880, UAS: 0.9112, LAS: 0.8414, UEM: 0.4779, LEM: 0.2394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6517, partial_loss/deprel_loss: 1.4157, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5415, loss: 1.0425, batch_reg_loss: 0.0786, reg_loss: 0.0778 ||:  64%|######3   | 71/111 [00:48<00:29,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9119, LAS: 0.8426, UEM: 0.4984, LEM: 0.2679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1117, partial_loss/deprel_loss: 0.2414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2941, loss: 1.0349, batch_reg_loss: 0.0786, reg_loss: 0.0779 ||:  67%|######6   | 74/111 [00:50<00:27,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7983, UAS: 0.9113, LAS: 0.8419, UEM: 0.4900, LEM: 0.2614, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4769, partial_loss/deprel_loss: 1.3341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4414, loss: 1.0420, batch_reg_loss: 0.0787, reg_loss: 0.0779 ||:  70%|#######   | 78/111 [00:53<00:23,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7141, UAS: 0.9108, LAS: 0.8416, UEM: 0.4961, LEM: 0.2649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2212, partial_loss/deprel_loss: 2.0886, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3939, loss: 1.0457, batch_reg_loss: 0.0788, reg_loss: 0.0779 ||:  74%|#######3  | 82/111 [00:56<00:20,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8603, UAS: 0.9102, LAS: 0.8409, UEM: 0.4893, LEM: 0.2593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6706, partial_loss/deprel_loss: 0.8114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8622, loss: 1.0496, batch_reg_loss: 0.0789, reg_loss: 0.0780 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7963, UAS: 0.9103, LAS: 0.8411, UEM: 0.4857, LEM: 0.2558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4870, partial_loss/deprel_loss: 1.3774, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4783, loss: 1.0499, batch_reg_loss: 0.0790, reg_loss: 0.0780 ||:  81%|########1 | 90/111 [01:01<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8439, UAS: 0.9096, LAS: 0.8401, UEM: 0.4780, LEM: 0.2496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7491, partial_loss/deprel_loss: 0.8945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9445, loss: 1.0577, batch_reg_loss: 0.0791, reg_loss: 0.0781 ||:  85%|########4 | 94/111 [01:03<00:10,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9107, LAS: 0.8414, UEM: 0.4827, LEM: 0.2505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6406, partial_loss/deprel_loss: 0.8061, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8522, loss: 1.0448, batch_reg_loss: 0.0792, reg_loss: 0.0781 ||:  88%|########8 | 98/111 [01:06<00:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8037, UAS: 0.9103, LAS: 0.8410, UEM: 0.4798, LEM: 0.2484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2133, partial_loss/deprel_loss: 1.2041, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2852, loss: 1.0474, batch_reg_loss: 0.0792, reg_loss: 0.0781 ||:  91%|######### | 101/111 [01:08<00:07,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7601, UAS: 0.9088, LAS: 0.8395, UEM: 0.4738, LEM: 0.2452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0699, partial_loss/deprel_loss: 1.6046, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7770, loss: 1.0608, batch_reg_loss: 0.0793, reg_loss: 0.0782 ||:  94%|#########3| 104/111 [01:11<00:04,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8128, UAS: 0.9079, LAS: 0.8384, UEM: 0.4676, LEM: 0.2416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1866, partial_loss/deprel_loss: 1.2551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3208, loss: 1.0707, batch_reg_loss: 0.0794, reg_loss: 0.0782 ||:  96%|#########6| 107/111 [01:13<00:02,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9092, LAS: 0.8398, UEM: 0.4744, LEM: 0.2438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3939, partial_loss/deprel_loss: 0.6267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6596, loss: 1.0586, batch_reg_loss: 0.0795, reg_loss: 0.0783 ||: 100%|##########| 111/111 [01:15<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9092, LAS: 0.8398, UEM: 0.4744, LEM: 0.2438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3939, partial_loss/deprel_loss: 0.6267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6596, loss: 1.0586, batch_reg_loss: 0.0795, reg_loss: 0.0783 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.627  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.394  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.078  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - UEM                      |     0.474  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - LAS                      |     0.840  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - loss                     |     1.059  |       N/A\n",
+      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - LEM                      |     0.244  |       N/A\n",
+      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - UAS                      |     0.909  |       N/A\n",
+      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - EM                       |     0.879  |       N/A\n",
+      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:09:36,177 - INFO - combo.training.trainer - Epoch duration: 0:01:15.855623\n",
+      "2023-04-06 23:09:36,177 - INFO - combo.training.trainer - Estimated training time remaining: 8:28:34\n",
+      "2023-04-06 23:09:36,178 - INFO - allennlp.training.trainer - Epoch 15/399\n",
+      "2023-04-06 23:09:36,178 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:09:36,178 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:09:36,183 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9129, LAS: 0.8471, UEM: 0.5121, LEM: 0.2814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.5037, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5505, loss: 1.0156, batch_reg_loss: 0.0795, reg_loss: 0.0795 ||:   3%|2         | 3/111 [00:02<01:16,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9213, LAS: 0.8539, UEM: 0.5395, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6728, partial_loss/deprel_loss: 0.8153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8665, loss: 0.9328, batch_reg_loss: 0.0796, reg_loss: 0.0796 ||:   6%|6         | 7/111 [00:04<01:10,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8601, UAS: 0.9119, LAS: 0.8434, UEM: 0.4963, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5714, partial_loss/deprel_loss: 0.8098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8418, loss: 1.0238, batch_reg_loss: 0.0797, reg_loss: 0.0796 ||:   9%|9         | 10/111 [00:06<01:08,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9158, LAS: 0.8482, UEM: 0.4947, LEM: 0.2493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4600, partial_loss/deprel_loss: 0.6518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6932, loss: 0.9811, batch_reg_loss: 0.0798, reg_loss: 0.0796 ||:  13%|#2        | 14/111 [00:09<01:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9126, LAS: 0.8430, UEM: 0.4992, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1905, partial_loss/deprel_loss: 0.5070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 1.0350, batch_reg_loss: 0.0799, reg_loss: 0.0797 ||:  16%|#6        | 18/111 [00:11<01:01,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9172, LAS: 0.8487, UEM: 0.5242, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3962, partial_loss/deprel_loss: 0.5998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.9883, batch_reg_loss: 0.0799, reg_loss: 0.0797 ||:  19%|#8        | 21/111 [00:14<01:01,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9172, LAS: 0.8486, UEM: 0.5373, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4394, partial_loss/deprel_loss: 0.6408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6805, loss: 0.9807, batch_reg_loss: 0.0800, reg_loss: 0.0797 ||:  22%|##1       | 24/111 [00:16<01:03,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8847, UAS: 0.9188, LAS: 0.8518, UEM: 0.5242, LEM: 0.2712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5723, partial_loss/deprel_loss: 0.6435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7094, loss: 0.9584, batch_reg_loss: 0.0801, reg_loss: 0.0798 ||:  25%|##5       | 28/111 [00:19<00:58,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9203, LAS: 0.8540, UEM: 0.5249, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.4650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5017, loss: 0.9409, batch_reg_loss: 0.0802, reg_loss: 0.0798 ||:  29%|##8       | 32/111 [00:21<00:54,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8028, UAS: 0.9190, LAS: 0.8522, UEM: 0.5190, LEM: 0.2695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3828, partial_loss/deprel_loss: 1.3768, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4582, loss: 0.9604, batch_reg_loss: 0.0802, reg_loss: 0.0799 ||:  32%|###1      | 35/111 [00:23<00:52,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7389, UAS: 0.9176, LAS: 0.8506, UEM: 0.5181, LEM: 0.2656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2919, partial_loss/deprel_loss: 1.6833, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8853, loss: 0.9725, batch_reg_loss: 0.0803, reg_loss: 0.0799 ||:  34%|###4      | 38/111 [00:26<00:52,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9187, LAS: 0.8517, UEM: 0.5193, LEM: 0.2625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3254, partial_loss/deprel_loss: 0.5673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5993, loss: 0.9599, batch_reg_loss: 0.0804, reg_loss: 0.0799 ||:  37%|###6      | 41/111 [00:28<00:50,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8510, UAS: 0.9194, LAS: 0.8522, UEM: 0.5159, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7491, partial_loss/deprel_loss: 0.8486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9091, loss: 0.9546, batch_reg_loss: 0.0804, reg_loss: 0.0800 ||:  40%|###9      | 44/111 [00:30<00:47,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9198, LAS: 0.8526, UEM: 0.5182, LEM: 0.2558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4518, partial_loss/deprel_loss: 0.7032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7334, loss: 0.9497, batch_reg_loss: 0.0805, reg_loss: 0.0800 ||:  42%|####2     | 47/111 [00:32<00:45,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9207, LAS: 0.8539, UEM: 0.5335, LEM: 0.2761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1517, partial_loss/deprel_loss: 0.3182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3655, loss: 0.9379, batch_reg_loss: 0.0805, reg_loss: 0.0800 ||:  45%|####5     | 50/111 [00:34<00:43,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8364, UAS: 0.9215, LAS: 0.8548, UEM: 0.5430, LEM: 0.2846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9017, partial_loss/deprel_loss: 1.0522, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1027, loss: 0.9278, batch_reg_loss: 0.0806, reg_loss: 0.0801 ||:  48%|####7     | 53/111 [00:37<00:42,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9200, LAS: 0.8530, UEM: 0.5317, LEM: 0.2759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6586, partial_loss/deprel_loss: 0.8304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8768, loss: 0.9473, batch_reg_loss: 0.0807, reg_loss: 0.0801 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9206, LAS: 0.8537, UEM: 0.5313, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3370, partial_loss/deprel_loss: 0.5406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5806, loss: 0.9414, batch_reg_loss: 0.0807, reg_loss: 0.0801 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8269, UAS: 0.9210, LAS: 0.8541, UEM: 0.5338, LEM: 0.2764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9455, partial_loss/deprel_loss: 1.0358, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0985, loss: 0.9351, batch_reg_loss: 0.0808, reg_loss: 0.0802 ||:  57%|#####6    | 63/111 [00:43<00:34,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7807, UAS: 0.9184, LAS: 0.8511, UEM: 0.5201, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6969, partial_loss/deprel_loss: 1.4591, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5876, loss: 0.9608, batch_reg_loss: 0.0809, reg_loss: 0.0802 ||:  60%|######    | 67/111 [00:46<00:30,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7824, UAS: 0.9154, LAS: 0.8479, UEM: 0.5090, LEM: 0.2617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7713, partial_loss/deprel_loss: 1.3922, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5490, loss: 0.9869, batch_reg_loss: 0.0810, reg_loss: 0.0802 ||:  64%|######3   | 71/111 [00:49<00:27,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9155, LAS: 0.8480, UEM: 0.5164, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1790, partial_loss/deprel_loss: 0.4022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4386, loss: 0.9870, batch_reg_loss: 0.0811, reg_loss: 0.0803 ||:  68%|######7   | 75/111 [00:51<00:24,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9141, LAS: 0.8463, UEM: 0.5077, LEM: 0.2615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6719, partial_loss/deprel_loss: 0.8466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8928, loss: 1.0058, batch_reg_loss: 0.0812, reg_loss: 0.0803 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7749, UAS: 0.9124, LAS: 0.8444, UEM: 0.4999, LEM: 0.2572, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7582, partial_loss/deprel_loss: 1.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5744, loss: 1.0213, batch_reg_loss: 0.0812, reg_loss: 0.0804 ||:  74%|#######3  | 82/111 [00:56<00:19,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9121, LAS: 0.8439, UEM: 0.4934, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5849, partial_loss/deprel_loss: 0.7789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8214, loss: 1.0266, batch_reg_loss: 0.0813, reg_loss: 0.0804 ||:  77%|#######6  | 85/111 [00:58<00:17,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9122, LAS: 0.8440, UEM: 0.4887, LEM: 0.2487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7833, partial_loss/deprel_loss: 1.0462, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0750, loss: 1.0278, batch_reg_loss: 0.0814, reg_loss: 0.0804 ||:  80%|########  | 89/111 [01:01<00:14,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9112, LAS: 0.8429, UEM: 0.4808, LEM: 0.2430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5965, partial_loss/deprel_loss: 0.7940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8360, loss: 1.0355, batch_reg_loss: 0.0815, reg_loss: 0.0805 ||:  84%|########3 | 93/111 [01:03<00:11,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7975, UAS: 0.9112, LAS: 0.8426, UEM: 0.4752, LEM: 0.2377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3786, partial_loss/deprel_loss: 1.3451, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4334, loss: 1.0376, batch_reg_loss: 0.0816, reg_loss: 0.0805 ||:  87%|########7 | 97/111 [01:05<00:08,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9109, LAS: 0.8420, UEM: 0.4715, LEM: 0.2341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6782, partial_loss/deprel_loss: 0.8343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8848, loss: 1.0429, batch_reg_loss: 0.0817, reg_loss: 0.0806 ||:  91%|######### | 101/111 [01:08<00:06,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7601, UAS: 0.9114, LAS: 0.8427, UEM: 0.4907, LEM: 0.2558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8753, partial_loss/deprel_loss: 1.6942, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8122, loss: 1.0390, batch_reg_loss: 0.0818, reg_loss: 0.0806 ||:  95%|#########4| 105/111 [01:11<00:04,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8028, UAS: 0.9112, LAS: 0.8426, UEM: 0.4832, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3786, partial_loss/deprel_loss: 1.2117, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3270, loss: 1.0401, batch_reg_loss: 0.0819, reg_loss: 0.0807 ||:  98%|#########8| 109/111 [01:14<00:01,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8393, UAS: 0.9112, LAS: 0.8424, UEM: 0.4790, LEM: 0.2474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8623, partial_loss/deprel_loss: 1.0124, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0643, loss: 1.0407, batch_reg_loss: 0.0819, reg_loss: 0.0807 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-06 23:10:51,901 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9633, LAS: 0.9155, UEM: 0.8426, LEM: 0.6012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2034, partial_loss/deprel_loss: 20.0996, partial_loss/cycle_loss: 0.0000, batch_loss: 16.1204, loss: 18.3759, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.05s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8487, UAS: 0.9482, LAS: 0.8943, UEM: 0.7481, LEM: 0.4864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1447, partial_loss/deprel_loss: 48.1773, partial_loss/cycle_loss: 0.0000, batch_loss: 38.7708, loss: 23.6897, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  31%|###       | 4/13 [00:04<00:09,  1.04s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8831, UAS: 0.9460, LAS: 0.8896, UEM: 0.6815, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5206, partial_loss/deprel_loss: 23.6872, partial_loss/cycle_loss: 0.0000, batch_loss: 19.0539, loss: 21.7025, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:06<00:05,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8469, UAS: 0.9392, LAS: 0.8802, UEM: 0.6161, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0001, partial_loss/deprel_loss: 36.3661, partial_loss/cycle_loss: 0.0000, batch_loss: 29.2929, loss: 24.2677, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:09<00:02,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8713, UAS: 0.9333, LAS: 0.8731, UEM: 0.5785, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7952, partial_loss/deprel_loss: 29.1962, partial_loss/cycle_loss: 0.0000, batch_loss: 23.5160, loss: 26.0322, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:01,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9363, LAS: 0.8771, UEM: 0.6121, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2237, partial_loss/deprel_loss: 23.0313, partial_loss/cycle_loss: 0.0000, batch_loss: 18.4698, loss: 25.4504, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
+      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.012  |    23.031\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.862  |     0.224\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.081  |     0.000\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - UEM                      |     0.479  |     0.612\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - LAS                      |     0.842  |     0.877\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - loss                     |     1.041  |    25.450\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - LEM                      |     0.247  |     0.344\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - UAS                      |     0.911  |     0.936\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - EM                       |     0.839  |     0.925\n",
+      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:11:04,513 - INFO - combo.training.trainer - Epoch duration: 0:01:28.335274\n",
+      "2023-04-06 23:11:04,513 - INFO - combo.training.trainer - Estimated training time remaining: 8:30:52\n",
+      "2023-04-06 23:11:04,513 - INFO - allennlp.training.trainer - Epoch 16/399\n",
+      "2023-04-06 23:11:04,513 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:11:04,513 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:11:04,519 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7589, UAS: 0.9080, LAS: 0.8432, UEM: 0.5846, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2122, partial_loss/deprel_loss: 1.5676, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7785, loss: 1.0280, batch_reg_loss: 0.0820, reg_loss: 0.0820 ||:   3%|2         | 3/111 [00:02<01:22,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8663, UAS: 0.9242, LAS: 0.8615, UEM: 0.5455, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6915, partial_loss/deprel_loss: 0.7745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8400, loss: 0.8831, batch_reg_loss: 0.0821, reg_loss: 0.0820 ||:   6%|6         | 7/111 [00:04<01:14,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8331, UAS: 0.9154, LAS: 0.8499, UEM: 0.4670, LEM: 0.2081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9397, partial_loss/deprel_loss: 1.1732, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2086, loss: 1.0023, batch_reg_loss: 0.0822, reg_loss: 0.0821 ||:   9%|9         | 10/111 [00:06<01:12,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8657, UAS: 0.9175, LAS: 0.8510, UEM: 0.4862, LEM: 0.2185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5694, partial_loss/deprel_loss: 0.7629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8065, loss: 0.9746, batch_reg_loss: 0.0823, reg_loss: 0.0821 ||:  13%|#2        | 14/111 [00:09<01:05,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8733, UAS: 0.9107, LAS: 0.8442, UEM: 0.4501, LEM: 0.1969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7070, partial_loss/deprel_loss: 0.7876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8538, loss: 1.0366, batch_reg_loss: 0.0823, reg_loss: 0.0821 ||:  16%|#6        | 18/111 [00:11<01:01,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9177, LAS: 0.8516, UEM: 0.5343, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2673, partial_loss/deprel_loss: 0.4801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5199, loss: 0.9668, batch_reg_loss: 0.0824, reg_loss: 0.0822 ||:  20%|#9        | 22/111 [00:14<00:58,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9192, LAS: 0.8529, UEM: 0.5322, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3409, partial_loss/deprel_loss: 0.5948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6265, loss: 0.9500, batch_reg_loss: 0.0825, reg_loss: 0.0822 ||:  23%|##2       | 25/111 [00:16<01:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8353, UAS: 0.9144, LAS: 0.8473, UEM: 0.5001, LEM: 0.2444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9402, partial_loss/deprel_loss: 1.0992, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1499, loss: 1.0039, batch_reg_loss: 0.0826, reg_loss: 0.0823 ||:  26%|##6       | 29/111 [00:19<00:54,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8619, UAS: 0.9124, LAS: 0.8448, UEM: 0.4943, LEM: 0.2411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6395, partial_loss/deprel_loss: 0.8357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8791, loss: 1.0205, batch_reg_loss: 0.0826, reg_loss: 0.0823 ||:  30%|##9       | 33/111 [00:21<00:50,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8202, UAS: 0.9116, LAS: 0.8445, UEM: 0.4757, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1420, partial_loss/deprel_loss: 1.1341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2184, loss: 1.0229, batch_reg_loss: 0.0827, reg_loss: 0.0823 ||:  32%|###2      | 36/111 [00:23<00:49,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9109, LAS: 0.8433, UEM: 0.4713, LEM: 0.2254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4303, partial_loss/deprel_loss: 0.6151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6610, loss: 1.0294, batch_reg_loss: 0.0828, reg_loss: 0.0824 ||:  36%|###6      | 40/111 [00:26<00:47,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8473, UAS: 0.9110, LAS: 0.8432, UEM: 0.4799, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7995, partial_loss/deprel_loss: 0.8820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9484, loss: 1.0291, batch_reg_loss: 0.0829, reg_loss: 0.0824 ||:  39%|###8      | 43/111 [00:28<00:47,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7958, UAS: 0.9110, LAS: 0.8432, UEM: 0.4756, LEM: 0.2299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3631, partial_loss/deprel_loss: 1.3073, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4014, loss: 1.0309, batch_reg_loss: 0.0829, reg_loss: 0.0825 ||:  41%|####1     | 46/111 [00:30<00:45,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8617, UAS: 0.9128, LAS: 0.8450, UEM: 0.4773, LEM: 0.2268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7004, partial_loss/deprel_loss: 0.9011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9440, loss: 1.0167, batch_reg_loss: 0.0830, reg_loss: 0.0825 ||:  44%|####4     | 49/111 [00:33<00:44,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8606, UAS: 0.9116, LAS: 0.8436, UEM: 0.4651, LEM: 0.2188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6289, partial_loss/deprel_loss: 0.8555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8933, loss: 1.0315, batch_reg_loss: 0.0831, reg_loss: 0.0825 ||:  48%|####7     | 53/111 [00:35<00:39,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8008, UAS: 0.9112, LAS: 0.8430, UEM: 0.4520, LEM: 0.2096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1899, partial_loss/deprel_loss: 1.2488, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3202, loss: 1.0350, batch_reg_loss: 0.0832, reg_loss: 0.0826 ||:  51%|#####1    | 57/111 [00:38<00:35,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9118, LAS: 0.8436, UEM: 0.4508, LEM: 0.2074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4705, partial_loss/deprel_loss: 0.6971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7350, loss: 1.0315, batch_reg_loss: 0.0833, reg_loss: 0.0826 ||:  55%|#####4    | 61/111 [00:40<00:34,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8310, UAS: 0.9122, LAS: 0.8440, UEM: 0.4514, LEM: 0.2077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0268, partial_loss/deprel_loss: 1.1379, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1990, loss: 1.0293, batch_reg_loss: 0.0833, reg_loss: 0.0826 ||:  58%|#####7    | 64/111 [00:43<00:32,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8854, UAS: 0.9126, LAS: 0.8445, UEM: 0.4557, LEM: 0.2132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3577, partial_loss/deprel_loss: 0.5272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5768, loss: 1.0256, batch_reg_loss: 0.0834, reg_loss: 0.0827 ||:  61%|######1   | 68/111 [00:45<00:29,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9138, LAS: 0.8459, UEM: 0.4563, LEM: 0.2122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6427, partial_loss/deprel_loss: 0.9296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9557, loss: 1.0155, batch_reg_loss: 0.0835, reg_loss: 0.0827 ||:  65%|######4   | 72/111 [00:48<00:26,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9128, LAS: 0.8448, UEM: 0.4481, LEM: 0.2077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9213, partial_loss/deprel_loss: 0.9996, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0676, loss: 1.0238, batch_reg_loss: 0.0836, reg_loss: 0.0828 ||:  68%|######8   | 76/111 [00:50<00:23,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9138, LAS: 0.8463, UEM: 0.4699, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.3164, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3683, loss: 1.0118, batch_reg_loss: 0.0837, reg_loss: 0.0828 ||:  72%|#######2  | 80/111 [00:53<00:20,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7485, UAS: 0.9127, LAS: 0.8450, UEM: 0.4712, LEM: 0.2295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4496, partial_loss/deprel_loss: 1.8294, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0372, loss: 1.0233, batch_reg_loss: 0.0838, reg_loss: 0.0829 ||:  76%|#######5  | 84/111 [00:56<00:17,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9140, LAS: 0.8467, UEM: 0.4935, LEM: 0.2568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0828, partial_loss/deprel_loss: 0.2183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2751, loss: 1.0081, batch_reg_loss: 0.0839, reg_loss: 0.0829 ||:  79%|#######9  | 88/111 [00:59<00:15,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9135, LAS: 0.8460, UEM: 0.4869, LEM: 0.2512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4877, partial_loss/deprel_loss: 0.7291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7648, loss: 1.0140, batch_reg_loss: 0.0840, reg_loss: 0.0830 ||:  83%|########2 | 92/111 [01:01<00:12,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9137, LAS: 0.8462, UEM: 0.4900, LEM: 0.2533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0775, partial_loss/deprel_loss: 1.0943, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1750, loss: 1.0106, batch_reg_loss: 0.0841, reg_loss: 0.0830 ||:  86%|########6 | 96/111 [01:04<00:10,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9119, LAS: 0.8443, UEM: 0.4847, LEM: 0.2501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0740, partial_loss/deprel_loss: 1.0761, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1598, loss: 1.0296, batch_reg_loss: 0.0841, reg_loss: 0.0830 ||:  89%|########9 | 99/111 [01:07<00:08,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8246, UAS: 0.9125, LAS: 0.8451, UEM: 0.4915, LEM: 0.2556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0728, partial_loss/deprel_loss: 1.0576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1448, loss: 1.0224, batch_reg_loss: 0.0842, reg_loss: 0.0831 ||:  92%|#########1| 102/111 [01:09<00:06,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8747, UAS: 0.9125, LAS: 0.8449, UEM: 0.4885, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4391, partial_loss/deprel_loss: 0.6192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6675, loss: 1.0221, batch_reg_loss: 0.0843, reg_loss: 0.0831 ||:  95%|#########4| 105/111 [01:11<00:04,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8539, UAS: 0.9127, LAS: 0.8451, UEM: 0.4833, LEM: 0.2480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6720, partial_loss/deprel_loss: 0.8026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8609, loss: 1.0200, batch_reg_loss: 0.0844, reg_loss: 0.0831 ||:  98%|#########8| 109/111 [01:13<00:01,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8645, UAS: 0.9127, LAS: 0.8451, UEM: 0.4802, LEM: 0.2455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5954, partial_loss/deprel_loss: 0.8870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9131, loss: 1.0210, batch_reg_loss: 0.0844, reg_loss: 0.0832 ||: 100%|##########| 111/111 [01:14<00:00,  1.48it/s]\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.887  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.595  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.083  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - UEM                      |     0.480  |       N/A\n",
+      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - LAS                      |     0.845  |       N/A\n",
+      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - loss                     |     1.021  |       N/A\n",
+      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - LEM                      |     0.246  |       N/A\n",
+      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - UAS                      |     0.913  |       N/A\n",
+      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - EM                       |     0.864  |       N/A\n",
+      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:12:19,454 - INFO - combo.training.trainer - Epoch duration: 0:01:14.940605\n",
+      "2023-04-06 23:12:19,454 - INFO - combo.training.trainer - Estimated training time remaining: 8:27:43\n",
+      "2023-04-06 23:12:19,454 - INFO - allennlp.training.trainer - Epoch 17/399\n",
+      "2023-04-06 23:12:19,454 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:12:19,454 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:12:19,461 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.9216, LAS: 0.8554, UEM: 0.3382, LEM: 0.1011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5816, partial_loss/deprel_loss: 0.8625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8908, loss: 0.9648, batch_reg_loss: 0.0845, reg_loss: 0.0845 ||:   4%|3         | 4/111 [00:02<01:04,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8527, UAS: 0.9265, LAS: 0.8618, UEM: 0.3934, LEM: 0.1398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6621, partial_loss/deprel_loss: 0.8200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8730, loss: 0.8968, batch_reg_loss: 0.0846, reg_loss: 0.0845 ||:   6%|6         | 7/111 [00:04<01:08,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9162, LAS: 0.8500, UEM: 0.3532, LEM: 0.1257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0305, partial_loss/deprel_loss: 0.9789, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0739, loss: 0.9920, batch_reg_loss: 0.0846, reg_loss: 0.0845 ||:   9%|9         | 10/111 [00:06<01:06,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8026, UAS: 0.9184, LAS: 0.8528, UEM: 0.4350, LEM: 0.1899, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3660, partial_loss/deprel_loss: 1.2370, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3475, loss: 0.9582, batch_reg_loss: 0.0847, reg_loss: 0.0846 ||:  12%|#1        | 13/111 [00:08<01:05,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9205, LAS: 0.8554, UEM: 0.4904, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4147, partial_loss/deprel_loss: 0.5218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5851, loss: 0.9331, batch_reg_loss: 0.0848, reg_loss: 0.0846 ||:  15%|#5        | 17/111 [00:11<01:02,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9219, LAS: 0.8575, UEM: 0.5308, LEM: 0.2704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1652, partial_loss/deprel_loss: 0.4622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4877, loss: 0.9235, batch_reg_loss: 0.0849, reg_loss: 0.0846 ||:  18%|#8        | 20/111 [00:13<01:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8204, UAS: 0.9207, LAS: 0.8556, UEM: 0.5155, LEM: 0.2657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1489, partial_loss/deprel_loss: 1.1239, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2139, loss: 0.9339, batch_reg_loss: 0.0850, reg_loss: 0.0847 ||:  22%|##1       | 24/111 [00:16<00:57,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8496, UAS: 0.9208, LAS: 0.8555, UEM: 0.4917, LEM: 0.2469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7885, partial_loss/deprel_loss: 0.9084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9694, loss: 0.9335, batch_reg_loss: 0.0850, reg_loss: 0.0847 ||:  25%|##5       | 28/111 [00:18<00:52,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9203, LAS: 0.8549, UEM: 0.4892, LEM: 0.2457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2998, partial_loss/deprel_loss: 0.5312, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5701, loss: 0.9418, batch_reg_loss: 0.0851, reg_loss: 0.0848 ||:  28%|##7       | 31/111 [00:20<00:53,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8699, UAS: 0.9203, LAS: 0.8548, UEM: 0.4730, LEM: 0.2298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5786, partial_loss/deprel_loss: 0.7671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8146, loss: 0.9400, batch_reg_loss: 0.0852, reg_loss: 0.0848 ||:  32%|###1      | 35/111 [00:23<00:50,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9223, LAS: 0.8573, UEM: 0.4940, LEM: 0.2481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5172, partial_loss/deprel_loss: 0.6889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7398, loss: 0.9204, batch_reg_loss: 0.0853, reg_loss: 0.0849 ||:  34%|###4      | 38/111 [00:25<00:50,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8749, UAS: 0.9217, LAS: 0.8563, UEM: 0.4839, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5008, partial_loss/deprel_loss: 0.7724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8034, loss: 0.9291, batch_reg_loss: 0.0854, reg_loss: 0.0849 ||:  38%|###7      | 42/111 [00:27<00:45,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9206, LAS: 0.8548, UEM: 0.4822, LEM: 0.2346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3619, partial_loss/deprel_loss: 0.5743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6173, loss: 0.9410, batch_reg_loss: 0.0854, reg_loss: 0.0849 ||:  41%|####      | 45/111 [00:30<00:46,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9174, LAS: 0.8517, UEM: 0.4643, LEM: 0.2239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9001, partial_loss/deprel_loss: 0.9548, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0294, loss: 0.9654, batch_reg_loss: 0.0855, reg_loss: 0.0850 ||:  44%|####4     | 49/111 [00:32<00:42,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9165, LAS: 0.8508, UEM: 0.4653, LEM: 0.2219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8402, partial_loss/deprel_loss: 0.8455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9301, loss: 0.9775, batch_reg_loss: 0.0856, reg_loss: 0.0850 ||:  48%|####7     | 53/111 [00:35<00:38,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8495, UAS: 0.9179, LAS: 0.8524, UEM: 0.4743, LEM: 0.2237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8424, partial_loss/deprel_loss: 0.9273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9960, loss: 0.9632, batch_reg_loss: 0.0857, reg_loss: 0.0851 ||:  51%|#####1    | 57/111 [00:37<00:35,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9181, LAS: 0.8528, UEM: 0.4839, LEM: 0.2345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3615, partial_loss/deprel_loss: 0.5027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.9589, batch_reg_loss: 0.0858, reg_loss: 0.0851 ||:  55%|#####4    | 61/111 [00:40<00:33,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9201, LAS: 0.8551, UEM: 0.5090, LEM: 0.2596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4550, partial_loss/deprel_loss: 0.6768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7183, loss: 0.9397, batch_reg_loss: 0.0859, reg_loss: 0.0852 ||:  59%|#####8    | 65/111 [00:43<00:30,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9196, LAS: 0.8545, UEM: 0.5017, LEM: 0.2534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6634, partial_loss/deprel_loss: 0.7655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8311, loss: 0.9431, batch_reg_loss: 0.0860, reg_loss: 0.0852 ||:  62%|######2   | 69/111 [00:46<00:28,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9189, LAS: 0.8537, UEM: 0.4995, LEM: 0.2534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4002, partial_loss/deprel_loss: 0.5723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6239, loss: 0.9510, batch_reg_loss: 0.0860, reg_loss: 0.0852 ||:  65%|######4   | 72/111 [00:48<00:26,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9195, LAS: 0.8542, UEM: 0.5001, LEM: 0.2517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4251, partial_loss/deprel_loss: 0.7046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7348, loss: 0.9440, batch_reg_loss: 0.0861, reg_loss: 0.0853 ||:  68%|######8   | 76/111 [00:50<00:23,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9161, LAS: 0.8505, UEM: 0.4923, LEM: 0.2467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5704, partial_loss/deprel_loss: 0.8707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8969, loss: 0.9753, batch_reg_loss: 0.0862, reg_loss: 0.0853 ||:  72%|#######2  | 80/111 [00:53<00:20,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8143, UAS: 0.9160, LAS: 0.8504, UEM: 0.4899, LEM: 0.2445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3190, partial_loss/deprel_loss: 1.2196, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3258, loss: 0.9778, batch_reg_loss: 0.0863, reg_loss: 0.0854 ||:  76%|#######5  | 84/111 [00:55<00:17,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7646, UAS: 0.9146, LAS: 0.8487, UEM: 0.4840, LEM: 0.2404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9803, partial_loss/deprel_loss: 1.4948, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6783, loss: 0.9919, batch_reg_loss: 0.0864, reg_loss: 0.0854 ||:  79%|#######9  | 88/111 [00:57<00:14,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9360, UAS: 0.9150, LAS: 0.8493, UEM: 0.5098, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0973, partial_loss/deprel_loss: 0.2371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2956, loss: 0.9903, batch_reg_loss: 0.0865, reg_loss: 0.0855 ||:  83%|########2 | 92/111 [01:01<00:12,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.9145, LAS: 0.8486, UEM: 0.5008, LEM: 0.2669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1653, partial_loss/deprel_loss: 1.1575, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2456, loss: 0.9977, batch_reg_loss: 0.0866, reg_loss: 0.0855 ||:  86%|########6 | 96/111 [01:05<00:11,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8094, UAS: 0.9144, LAS: 0.8484, UEM: 0.4967, LEM: 0.2632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3131, partial_loss/deprel_loss: 1.1735, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2881, loss: 0.9981, batch_reg_loss: 0.0867, reg_loss: 0.0855 ||:  89%|########9 | 99/111 [01:07<00:09,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8428, UAS: 0.9144, LAS: 0.8483, UEM: 0.4979, LEM: 0.2638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8804, partial_loss/deprel_loss: 1.0840, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1300, loss: 0.9994, batch_reg_loss: 0.0867, reg_loss: 0.0856 ||:  92%|#########1| 102/111 [01:09<00:06,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9148, LAS: 0.8489, UEM: 0.4973, LEM: 0.2625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4124, partial_loss/deprel_loss: 0.5711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6262, loss: 0.9941, batch_reg_loss: 0.0868, reg_loss: 0.0856 ||:  95%|#########4| 105/111 [01:12<00:04,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9151, LAS: 0.8490, UEM: 0.4923, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7387, partial_loss/deprel_loss: 0.8004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8749, loss: 0.9937, batch_reg_loss: 0.0869, reg_loss: 0.0857 ||:  98%|#########8| 109/111 [01:14<00:01,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8040, UAS: 0.9140, LAS: 0.8479, UEM: 0.4885, LEM: 0.2549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3149, partial_loss/deprel_loss: 1.1623, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2798, loss: 1.0035, batch_reg_loss: 0.0869, reg_loss: 0.0857 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-06 23:13:34,894 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.162  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.315  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.086  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - UEM                      |     0.489  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - LAS                      |     0.848  |       N/A\n",
+      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - loss                     |     1.004  |       N/A\n",
+      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - LEM                      |     0.255  |       N/A\n",
+      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - UAS                      |     0.914  |       N/A\n",
+      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - EM                       |     0.804  |       N/A\n",
+      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:13:34,897 - INFO - combo.training.trainer - Epoch duration: 0:01:15.442752\n",
+      "2023-04-06 23:13:34,897 - INFO - combo.training.trainer - Estimated training time remaining: 8:24:56\n",
+      "2023-04-06 23:13:34,897 - INFO - allennlp.training.trainer - Epoch 18/399\n",
+      "2023-04-06 23:13:34,897 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:13:34,897 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:13:34,904 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8228, UAS: 0.9169, LAS: 0.8505, UEM: 0.3212, LEM: 0.0933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0915, partial_loss/deprel_loss: 1.1094, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1928, loss: 0.9545, batch_reg_loss: 0.0870, reg_loss: 0.0870 ||:   3%|2         | 3/111 [00:02<01:20,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9276, LAS: 0.8623, UEM: 0.5231, LEM: 0.2611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3255, partial_loss/deprel_loss: 0.5087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5591, loss: 0.8390, batch_reg_loss: 0.0871, reg_loss: 0.0870 ||:   5%|5         | 6/111 [00:04<01:20,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9346, LAS: 0.8740, UEM: 0.6711, LEM: 0.4448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1051, partial_loss/deprel_loss: 0.2196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2839, loss: 0.7732, batch_reg_loss: 0.0872, reg_loss: 0.0871 ||:   9%|9         | 10/111 [00:07<01:17,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8591, UAS: 0.9301, LAS: 0.8680, UEM: 0.6054, LEM: 0.3828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6862, partial_loss/deprel_loss: 0.8887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9355, loss: 0.8377, batch_reg_loss: 0.0873, reg_loss: 0.0871 ||:  13%|#2        | 14/111 [00:10<01:09,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9300, LAS: 0.8676, UEM: 0.5688, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5562, partial_loss/deprel_loss: 0.6804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7430, loss: 0.8469, batch_reg_loss: 0.0874, reg_loss: 0.0872 ||:  16%|#6        | 18/111 [00:12<01:04,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9308, LAS: 0.8677, UEM: 0.5772, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1748, partial_loss/deprel_loss: 0.4864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5115, loss: 0.8475, batch_reg_loss: 0.0874, reg_loss: 0.0872 ||:  20%|#9        | 22/111 [00:15<01:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9230, LAS: 0.8594, UEM: 0.5669, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3768, partial_loss/deprel_loss: 0.5494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6024, loss: 0.9163, batch_reg_loss: 0.0875, reg_loss: 0.0872 ||:  23%|##2       | 25/111 [00:17<01:01,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8352, UAS: 0.9221, LAS: 0.8583, UEM: 0.5419, LEM: 0.3100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9141, partial_loss/deprel_loss: 1.1264, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1715, loss: 0.9262, batch_reg_loss: 0.0876, reg_loss: 0.0873 ||:  25%|##5       | 28/111 [00:19<00:57,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9203, LAS: 0.8562, UEM: 0.5457, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3203, partial_loss/deprel_loss: 0.5512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.9386, batch_reg_loss: 0.0876, reg_loss: 0.0873 ||:  28%|##7       | 31/111 [00:21<00:55,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8389, UAS: 0.9183, LAS: 0.8538, UEM: 0.5326, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9560, partial_loss/deprel_loss: 0.9772, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0607, loss: 0.9626, batch_reg_loss: 0.0877, reg_loss: 0.0874 ||:  32%|###1      | 35/111 [00:24<00:51,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9185, LAS: 0.8543, UEM: 0.5263, LEM: 0.2879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3537, partial_loss/deprel_loss: 0.5632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6091, loss: 0.9598, batch_reg_loss: 0.0878, reg_loss: 0.0874 ||:  35%|###5      | 39/111 [00:27<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9138, LAS: 0.8490, UEM: 0.5170, LEM: 0.2822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4010, partial_loss/deprel_loss: 0.5286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5910, loss: 1.0039, batch_reg_loss: 0.0879, reg_loss: 0.0874 ||:  39%|###8      | 43/111 [00:29<00:47,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9152, LAS: 0.8507, UEM: 0.5210, LEM: 0.2825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4241, partial_loss/deprel_loss: 0.6749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 0.9916, batch_reg_loss: 0.0880, reg_loss: 0.0875 ||:  41%|####1     | 46/111 [00:32<00:45,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8042, UAS: 0.9142, LAS: 0.8494, UEM: 0.5098, LEM: 0.2753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3450, partial_loss/deprel_loss: 1.1223, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2549, loss: 0.9971, batch_reg_loss: 0.0881, reg_loss: 0.0875 ||:  44%|####4     | 49/111 [00:34<00:44,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9148, LAS: 0.8502, UEM: 0.5006, LEM: 0.2659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4315, partial_loss/deprel_loss: 0.6747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7142, loss: 0.9906, batch_reg_loss: 0.0882, reg_loss: 0.0876 ||:  48%|####7     | 53/111 [00:36<00:40,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9139, LAS: 0.8492, UEM: 0.4906, LEM: 0.2577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5756, partial_loss/deprel_loss: 0.7295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7870, loss: 0.9980, batch_reg_loss: 0.0883, reg_loss: 0.0876 ||:  51%|#####1    | 57/111 [00:39<00:35,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7875, UAS: 0.9122, LAS: 0.8470, UEM: 0.4822, LEM: 0.2516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5783, partial_loss/deprel_loss: 1.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5525, loss: 1.0136, batch_reg_loss: 0.0884, reg_loss: 0.0877 ||:  55%|#####4    | 61/111 [00:41<00:33,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9123, LAS: 0.8474, UEM: 0.4979, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2670, partial_loss/deprel_loss: 0.4382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4924, loss: 1.0101, batch_reg_loss: 0.0884, reg_loss: 0.0877 ||:  59%|#####8    | 65/111 [00:44<00:31,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8053, UAS: 0.9124, LAS: 0.8475, UEM: 0.4922, LEM: 0.2636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3323, partial_loss/deprel_loss: 1.3069, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4005, loss: 1.0098, batch_reg_loss: 0.0885, reg_loss: 0.0877 ||:  61%|######1   | 68/111 [00:46<00:29,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9130, LAS: 0.8481, UEM: 0.4973, LEM: 0.2674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1742, partial_loss/deprel_loss: 1.2064, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2885, loss: 1.0040, batch_reg_loss: 0.0886, reg_loss: 0.0878 ||:  64%|######3   | 71/111 [00:48<00:27,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9135, LAS: 0.8489, UEM: 0.5123, LEM: 0.2847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1399, partial_loss/deprel_loss: 0.3012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3576, loss: 0.9980, batch_reg_loss: 0.0887, reg_loss: 0.0878 ||:  68%|######7   | 75/111 [00:51<00:24,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.9134, LAS: 0.8486, UEM: 0.5078, LEM: 0.2796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7427, partial_loss/deprel_loss: 0.9010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9581, loss: 1.0009, batch_reg_loss: 0.0887, reg_loss: 0.0879 ||:  70%|#######   | 78/111 [00:53<00:23,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7803, UAS: 0.9131, LAS: 0.8483, UEM: 0.5069, LEM: 0.2774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8427, partial_loss/deprel_loss: 1.5858, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7260, loss: 1.0046, batch_reg_loss: 0.0888, reg_loss: 0.0879 ||:  73%|#######2  | 81/111 [00:56<00:21,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8095, UAS: 0.9134, LAS: 0.8483, UEM: 0.5000, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2830, partial_loss/deprel_loss: 1.1385, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2563, loss: 1.0034, batch_reg_loss: 0.0889, reg_loss: 0.0879 ||:  77%|#######6  | 85/111 [00:58<00:17,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8533, UAS: 0.9131, LAS: 0.8480, UEM: 0.4932, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8080, partial_loss/deprel_loss: 0.8970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9682, loss: 1.0072, batch_reg_loss: 0.0890, reg_loss: 0.0880 ||:  80%|########  | 89/111 [01:00<00:14,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9132, LAS: 0.8480, UEM: 0.4909, LEM: 0.2622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3357, partial_loss/deprel_loss: 0.5487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5952, loss: 1.0083, batch_reg_loss: 0.0891, reg_loss: 0.0880 ||:  84%|########3 | 93/111 [01:03<00:11,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9140, LAS: 0.8488, UEM: 0.4943, LEM: 0.2648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4893, partial_loss/deprel_loss: 0.7979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8254, loss: 1.0029, batch_reg_loss: 0.0892, reg_loss: 0.0881 ||:  87%|########7 | 97/111 [01:06<00:09,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8230, UAS: 0.9135, LAS: 0.8483, UEM: 0.4857, LEM: 0.2584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1926, partial_loss/deprel_loss: 1.1354, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2361, loss: 1.0052, batch_reg_loss: 0.0893, reg_loss: 0.0881 ||:  91%|######### | 101/111 [01:08<00:06,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8649, UAS: 0.9144, LAS: 0.8493, UEM: 0.4890, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6948, partial_loss/deprel_loss: 0.8095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8759, loss: 0.9975, batch_reg_loss: 0.0893, reg_loss: 0.0882 ||:  94%|#########3| 104/111 [01:11<00:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8489, UAS: 0.9143, LAS: 0.8492, UEM: 0.4848, LEM: 0.2548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9411, partial_loss/deprel_loss: 0.8917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9910, loss: 0.9983, batch_reg_loss: 0.0894, reg_loss: 0.0882 ||:  96%|#########6| 107/111 [01:13<00:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9151, LAS: 0.8501, UEM: 0.4914, LEM: 0.2580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3863, partial_loss/deprel_loss: 0.6280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6691, loss: 0.9898, batch_reg_loss: 0.0895, reg_loss: 0.0882 ||:  99%|#########9| 110/111 [01:15<00:00,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9153, LAS: 0.8503, UEM: 0.4906, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5699, partial_loss/deprel_loss: 0.8068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8490, loss: 0.9886, batch_reg_loss: 0.0895, reg_loss: 0.0882 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
+      "2023-04-06 23:14:50,914 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:14:50,914 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.807  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.570  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.088  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - UEM                      |     0.491  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - LAS                      |     0.850  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - loss                     |     0.989  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - LEM                      |     0.257  |       N/A\n",
+      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - UAS                      |     0.915  |       N/A\n",
+      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - EM                       |     0.870  |       N/A\n",
+      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:14:50,916 - INFO - combo.training.trainer - Epoch duration: 0:01:16.019608\n",
+      "2023-04-06 23:14:50,917 - INFO - combo.training.trainer - Estimated training time remaining: 8:22:31\n",
+      "2023-04-06 23:14:50,917 - INFO - allennlp.training.trainer - Epoch 19/399\n",
+      "2023-04-06 23:14:50,917 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:14:50,917 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-06 23:14:50,923 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9280, LAS: 0.8663, UEM: 0.4818, LEM: 0.2052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3412, partial_loss/deprel_loss: 0.5427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5920, loss: 0.8326, batch_reg_loss: 0.0896, reg_loss: 0.0896 ||:   4%|3         | 4/111 [00:02<01:06,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8347, UAS: 0.9147, LAS: 0.8502, UEM: 0.3867, LEM: 0.1510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0561, partial_loss/deprel_loss: 1.0243, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1203, loss: 0.9958, batch_reg_loss: 0.0897, reg_loss: 0.0896 ||:   6%|6         | 7/111 [00:04<01:07,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7890, UAS: 0.9112, LAS: 0.8450, UEM: 0.3595, LEM: 0.1344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5057, partial_loss/deprel_loss: 1.4440, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5460, loss: 1.0469, batch_reg_loss: 0.0897, reg_loss: 0.0896 ||:   9%|9         | 10/111 [00:06<01:06,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9132, LAS: 0.8471, UEM: 0.3635, LEM: 0.1282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8014, partial_loss/deprel_loss: 0.8880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9604, loss: 1.0209, batch_reg_loss: 0.0898, reg_loss: 0.0897 ||:  12%|#1        | 13/111 [00:08<01:05,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8711, UAS: 0.9142, LAS: 0.8481, UEM: 0.3500, LEM: 0.1202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5703, partial_loss/deprel_loss: 0.7201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7801, loss: 1.0151, batch_reg_loss: 0.0899, reg_loss: 0.0897 ||:  15%|#5        | 17/111 [00:11<01:02,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8080, UAS: 0.9147, LAS: 0.8485, UEM: 0.3594, LEM: 0.1297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3113, partial_loss/deprel_loss: 1.1270, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2538, loss: 1.0083, batch_reg_loss: 0.0899, reg_loss: 0.0897 ||:  18%|#8        | 20/111 [00:13<01:01,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8353, UAS: 0.9089, LAS: 0.8422, UEM: 0.3288, LEM: 0.1173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0613, partial_loss/deprel_loss: 0.9594, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0698, loss: 1.0639, batch_reg_loss: 0.0900, reg_loss: 0.0898 ||:  22%|##1       | 24/111 [00:16<00:57,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8194, UAS: 0.9075, LAS: 0.8401, UEM: 0.3043, LEM: 0.1081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1332, partial_loss/deprel_loss: 1.1339, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2239, loss: 1.0805, batch_reg_loss: 0.0901, reg_loss: 0.0898 ||:  25%|##5       | 28/111 [00:18<00:54,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9118, LAS: 0.8454, UEM: 0.3797, LEM: 0.1651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2529, partial_loss/deprel_loss: 0.4029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4631, loss: 1.0336, batch_reg_loss: 0.0902, reg_loss: 0.0899 ||:  28%|##7       | 31/111 [00:20<00:53,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9146, LAS: 0.8488, UEM: 0.4005, LEM: 0.1766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2672, partial_loss/deprel_loss: 0.4931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5382, loss: 1.0074, batch_reg_loss: 0.0903, reg_loss: 0.0899 ||:  32%|###1      | 35/111 [00:23<00:51,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9167, LAS: 0.8515, UEM: 0.4096, LEM: 0.1790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5449, partial_loss/deprel_loss: 0.7061, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7642, loss: 0.9820, batch_reg_loss: 0.0904, reg_loss: 0.0899 ||:  35%|###5      | 39/111 [00:25<00:47,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9189, LAS: 0.8544, UEM: 0.4478, LEM: 0.2113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2027, partial_loss/deprel_loss: 0.4174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4649, loss: 0.9584, batch_reg_loss: 0.0905, reg_loss: 0.0900 ||:  38%|###7      | 42/111 [00:28<00:47,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8055, UAS: 0.9189, LAS: 0.8545, UEM: 0.4558, LEM: 0.2175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4937, partial_loss/deprel_loss: 1.2253, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3695, loss: 0.9560, batch_reg_loss: 0.0905, reg_loss: 0.0900 ||:  41%|####      | 45/111 [00:30<00:46,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7630, UAS: 0.9134, LAS: 0.8488, UEM: 0.4408, LEM: 0.2103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9478, partial_loss/deprel_loss: 1.5173, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6940, loss: 1.0013, batch_reg_loss: 0.0906, reg_loss: 0.0901 ||:  44%|####4     | 49/111 [00:33<00:42,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9136, LAS: 0.8490, UEM: 0.4447, LEM: 0.2155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3234, partial_loss/deprel_loss: 0.4641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5266, loss: 1.0002, batch_reg_loss: 0.0907, reg_loss: 0.0901 ||:  47%|####6     | 52/111 [00:35<00:42,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8632, UAS: 0.9148, LAS: 0.8508, UEM: 0.4497, LEM: 0.2170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8531, partial_loss/deprel_loss: 0.7755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8818, loss: 0.9856, batch_reg_loss: 0.0907, reg_loss: 0.0901 ||:  50%|####9     | 55/111 [00:37<00:39,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8783, UAS: 0.9144, LAS: 0.8503, UEM: 0.4407, LEM: 0.2094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4102, partial_loss/deprel_loss: 0.7027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7350, loss: 0.9948, batch_reg_loss: 0.0908, reg_loss: 0.0902 ||:  53%|#####3    | 59/111 [00:40<00:35,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9144, LAS: 0.8500, UEM: 0.4305, LEM: 0.2013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7175, partial_loss/deprel_loss: 0.8354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9027, loss: 0.9954, batch_reg_loss: 0.0909, reg_loss: 0.0902 ||:  57%|#####6    | 63/111 [00:42<00:32,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9160, LAS: 0.8519, UEM: 0.4603, LEM: 0.2304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1260, partial_loss/deprel_loss: 0.2969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3537, loss: 0.9770, batch_reg_loss: 0.0910, reg_loss: 0.0903 ||:  59%|#####9    | 66/111 [00:44<00:31,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9146, LAS: 0.8503, UEM: 0.4620, LEM: 0.2308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3607, partial_loss/deprel_loss: 0.5944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6387, loss: 0.9922, batch_reg_loss: 0.0911, reg_loss: 0.0903 ||:  62%|######2   | 69/111 [00:47<00:29,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9152, LAS: 0.8511, UEM: 0.4865, LEM: 0.2638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0865, partial_loss/deprel_loss: 0.2023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2703, loss: 0.9884, batch_reg_loss: 0.0911, reg_loss: 0.0903 ||:  65%|######4   | 72/111 [00:49<00:29,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7450, UAS: 0.9129, LAS: 0.8483, UEM: 0.4786, LEM: 0.2592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4474, partial_loss/deprel_loss: 1.6060, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8655, loss: 1.0093, batch_reg_loss: 0.0912, reg_loss: 0.0904 ||:  68%|######7   | 75/111 [00:51<00:26,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9145, LAS: 0.8501, UEM: 0.4913, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3422, partial_loss/deprel_loss: 0.5563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6047, loss: 0.9942, batch_reg_loss: 0.0913, reg_loss: 0.0904 ||:  70%|#######   | 78/111 [00:53<00:23,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8686, UAS: 0.9147, LAS: 0.8503, UEM: 0.4911, LEM: 0.2628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6024, partial_loss/deprel_loss: 0.8119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8614, loss: 0.9942, batch_reg_loss: 0.0914, reg_loss: 0.0904 ||:  74%|#######3  | 82/111 [00:56<00:19,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8070, UAS: 0.9148, LAS: 0.8505, UEM: 0.4921, LEM: 0.2639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3560, partial_loss/deprel_loss: 1.2549, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3665, loss: 0.9919, batch_reg_loss: 0.0914, reg_loss: 0.0905 ||:  77%|#######6  | 85/111 [00:58<00:18,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8503, UAS: 0.9139, LAS: 0.8493, UEM: 0.4854, LEM: 0.2583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7237, partial_loss/deprel_loss: 0.8698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9321, loss: 1.0020, batch_reg_loss: 0.0915, reg_loss: 0.0905 ||:  80%|########  | 89/111 [01:01<00:15,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7970, UAS: 0.9132, LAS: 0.8486, UEM: 0.4798, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6280, partial_loss/deprel_loss: 1.2208, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3938, loss: 1.0073, batch_reg_loss: 0.0916, reg_loss: 0.0905 ||:  83%|########2 | 92/111 [01:03<00:13,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9145, LAS: 0.8499, UEM: 0.4895, LEM: 0.2595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1750, partial_loss/deprel_loss: 0.4655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4991, loss: 0.9969, batch_reg_loss: 0.0917, reg_loss: 0.0906 ||:  86%|########5 | 95/111 [01:05<00:11,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8012, UAS: 0.9144, LAS: 0.8497, UEM: 0.4877, LEM: 0.2581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4152, partial_loss/deprel_loss: 1.2303, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3590, loss: 0.9990, batch_reg_loss: 0.0917, reg_loss: 0.0906 ||:  88%|########8 | 98/111 [01:07<00:09,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8507, UAS: 0.9146, LAS: 0.8498, UEM: 0.4837, LEM: 0.2542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7947, partial_loss/deprel_loss: 0.9044, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9742, loss: 0.9972, batch_reg_loss: 0.0918, reg_loss: 0.0907 ||:  91%|######### | 101/111 [01:09<00:07,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9154, LAS: 0.8507, UEM: 0.4849, LEM: 0.2528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4251, partial_loss/deprel_loss: 0.5496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6166, loss: 0.9904, batch_reg_loss: 0.0919, reg_loss: 0.0907 ||:  95%|#########4| 105/111 [01:12<00:04,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9157, LAS: 0.8511, UEM: 0.4917, LEM: 0.2596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4593, partial_loss/deprel_loss: 0.6486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7027, loss: 0.9860, batch_reg_loss: 0.0919, reg_loss: 0.0907 ||:  97%|#########7| 108/111 [01:15<00:02,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8103, UAS: 0.9161, LAS: 0.8514, UEM: 0.4941, LEM: 0.2598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3019, partial_loss/deprel_loss: 1.1335, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2592, loss: 0.9835, batch_reg_loss: 0.0920, reg_loss: 0.0908 ||: 100%|##########| 111/111 [01:17<00:00,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8103, UAS: 0.9161, LAS: 0.8514, UEM: 0.4941, LEM: 0.2598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3019, partial_loss/deprel_loss: 1.1335, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2592, loss: 0.9835, batch_reg_loss: 0.0920, reg_loss: 0.0908 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
+      "2023-04-06 23:16:08,307 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.134  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.302  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.091  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - UEM                      |     0.494  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - LAS                      |     0.851  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - loss                     |     0.984  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - LEM                      |     0.260  |       N/A\n",
+      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - UAS                      |     0.916  |       N/A\n",
+      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - EM                       |     0.810  |       N/A\n",
+      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:16:08,309 - INFO - combo.training.trainer - Epoch duration: 0:01:17.392753\n",
+      "2023-04-06 23:16:08,310 - INFO - combo.training.trainer - Estimated training time remaining: 8:20:39\n",
+      "2023-04-06 23:16:08,310 - INFO - allennlp.training.trainer - Epoch 20/399\n",
+      "2023-04-06 23:16:08,310 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:16:08,310 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-06 23:16:08,316 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9521, LAS: 0.8974, UEM: 0.7753, LEM: 0.6200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3512, partial_loss/deprel_loss: 0.6386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6732, loss: 0.6190, batch_reg_loss: 0.0921, reg_loss: 0.0920 ||:   3%|2         | 3/111 [00:02<01:31,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7149, UAS: 0.9217, LAS: 0.8639, UEM: 0.7221, LEM: 0.5348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0170, partial_loss/deprel_loss: 1.8682, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1901, loss: 0.8866, batch_reg_loss: 0.0921, reg_loss: 0.0921 ||:   6%|6         | 7/111 [00:04<01:20,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9203, LAS: 0.8612, UEM: 0.6885, LEM: 0.4941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2541, partial_loss/deprel_loss: 0.4469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5005, loss: 0.9092, batch_reg_loss: 0.0922, reg_loss: 0.0921 ||:   9%|9         | 10/111 [00:07<01:16,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8377, UAS: 0.9200, LAS: 0.8602, UEM: 0.6465, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9482, partial_loss/deprel_loss: 1.0288, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.9218, batch_reg_loss: 0.0923, reg_loss: 0.0921 ||:  12%|#1        | 13/111 [00:09<01:13,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9260, LAS: 0.8667, UEM: 0.6404, LEM: 0.4198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3305, partial_loss/deprel_loss: 0.5257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5790, loss: 0.8611, batch_reg_loss: 0.0923, reg_loss: 0.0922 ||:  15%|#5        | 17/111 [00:11<01:06,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8555, UAS: 0.9266, LAS: 0.8650, UEM: 0.6031, LEM: 0.3783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6330, partial_loss/deprel_loss: 0.8089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8662, loss: 0.8658, batch_reg_loss: 0.0924, reg_loss: 0.0922 ||:  19%|#8        | 21/111 [00:14<01:01,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9235, LAS: 0.8615, UEM: 0.5818, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5684, partial_loss/deprel_loss: 0.7775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8282, loss: 0.8950, batch_reg_loss: 0.0925, reg_loss: 0.0923 ||:  22%|##1       | 24/111 [00:16<00:59,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9259, LAS: 0.8641, UEM: 0.5802, LEM: 0.3457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4870, partial_loss/deprel_loss: 0.6752, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7301, loss: 0.8726, batch_reg_loss: 0.0926, reg_loss: 0.0923 ||:  24%|##4       | 27/111 [00:18<00:58,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9255, LAS: 0.8640, UEM: 0.5700, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3910, partial_loss/deprel_loss: 0.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5549, loss: 0.8753, batch_reg_loss: 0.0926, reg_loss: 0.0923 ||:  27%|##7       | 30/111 [00:20<00:56,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8875, UAS: 0.9263, LAS: 0.8651, UEM: 0.5635, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5597, partial_loss/deprel_loss: 0.6210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7014, loss: 0.8682, batch_reg_loss: 0.0927, reg_loss: 0.0923 ||:  30%|##9       | 33/111 [00:22<00:53,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9252, LAS: 0.8637, UEM: 0.5582, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3287, partial_loss/deprel_loss: 0.5773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6203, loss: 0.8801, batch_reg_loss: 0.0927, reg_loss: 0.0924 ||:  32%|###2      | 36/111 [00:24<00:52,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.9254, LAS: 0.8637, UEM: 0.5541, LEM: 0.3170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6296, partial_loss/deprel_loss: 0.7761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8396, loss: 0.8814, batch_reg_loss: 0.0928, reg_loss: 0.0924 ||:  35%|###5      | 39/111 [00:27<00:52,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9236, LAS: 0.8612, UEM: 0.5381, LEM: 0.3055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0152, partial_loss/deprel_loss: 0.9462, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0529, loss: 0.9042, batch_reg_loss: 0.0929, reg_loss: 0.0924 ||:  38%|###7      | 42/111 [00:29<00:50,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8396, UAS: 0.9249, LAS: 0.8627, UEM: 0.5504, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8873, partial_loss/deprel_loss: 1.0102, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0786, loss: 0.8923, batch_reg_loss: 0.0929, reg_loss: 0.0925 ||:  41%|####      | 45/111 [00:31<00:47,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8389, UAS: 0.9246, LAS: 0.8622, UEM: 0.5363, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8750, partial_loss/deprel_loss: 0.9418, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0214, loss: 0.8949, batch_reg_loss: 0.0930, reg_loss: 0.0925 ||:  44%|####4     | 49/111 [00:33<00:42,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9244, LAS: 0.8620, UEM: 0.5327, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7190, partial_loss/deprel_loss: 0.8342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9043, loss: 0.8976, batch_reg_loss: 0.0931, reg_loss: 0.0925 ||:  47%|####6     | 52/111 [00:35<00:40,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8847, UAS: 0.9237, LAS: 0.8612, UEM: 0.5251, LEM: 0.2915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 0.6874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7233, loss: 0.9062, batch_reg_loss: 0.0931, reg_loss: 0.0926 ||:  50%|####9     | 55/111 [00:37<00:38,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9240, LAS: 0.8615, UEM: 0.5296, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3117, partial_loss/deprel_loss: 0.4649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5275, loss: 0.9034, batch_reg_loss: 0.0932, reg_loss: 0.0926 ||:  52%|#####2    | 58/111 [00:40<00:37,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9247, LAS: 0.8623, UEM: 0.5344, LEM: 0.2969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3854, partial_loss/deprel_loss: 0.5744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6299, loss: 0.8967, batch_reg_loss: 0.0933, reg_loss: 0.0926 ||:  55%|#####4    | 61/111 [00:42<00:35,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7501, UAS: 0.9220, LAS: 0.8592, UEM: 0.5220, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0578, partial_loss/deprel_loss: 1.6962, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8619, loss: 0.9225, batch_reg_loss: 0.0934, reg_loss: 0.0927 ||:  59%|#####8    | 65/111 [00:45<00:32,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8401, UAS: 0.9210, LAS: 0.8582, UEM: 0.5109, LEM: 0.2804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8382, partial_loss/deprel_loss: 0.9579, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0274, loss: 0.9295, batch_reg_loss: 0.0934, reg_loss: 0.0927 ||:  62%|######2   | 69/111 [00:47<00:27,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8715, UAS: 0.9208, LAS: 0.8578, UEM: 0.5065, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5938, partial_loss/deprel_loss: 0.7648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8241, loss: 0.9320, batch_reg_loss: 0.0935, reg_loss: 0.0928 ||:  66%|######5   | 73/111 [00:50<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9205, LAS: 0.8575, UEM: 0.5089, LEM: 0.2756, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4596, partial_loss/deprel_loss: 0.7226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7637, loss: 0.9351, batch_reg_loss: 0.0936, reg_loss: 0.0928 ||:  69%|######9   | 77/111 [00:53<00:23,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8154, UAS: 0.9196, LAS: 0.8565, UEM: 0.5025, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3989, partial_loss/deprel_loss: 1.2230, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3519, loss: 0.9459, batch_reg_loss: 0.0937, reg_loss: 0.0929 ||:  73%|#######2  | 81/111 [00:55<00:19,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9202, LAS: 0.8571, UEM: 0.5031, LEM: 0.2700, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3432, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6244, loss: 0.9399, batch_reg_loss: 0.0938, reg_loss: 0.0929 ||:  77%|#######6  | 85/111 [00:57<00:16,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7840, UAS: 0.9193, LAS: 0.8562, UEM: 0.4962, LEM: 0.2652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9018, partial_loss/deprel_loss: 1.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6089, loss: 0.9479, batch_reg_loss: 0.0939, reg_loss: 0.0929 ||:  80%|########  | 89/111 [01:01<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7733, UAS: 0.9190, LAS: 0.8557, UEM: 0.4967, LEM: 0.2642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9213, partial_loss/deprel_loss: 1.5481, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7167, loss: 0.9522, batch_reg_loss: 0.0940, reg_loss: 0.0930 ||:  83%|########2 | 92/111 [01:03<00:13,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8547, UAS: 0.9182, LAS: 0.8549, UEM: 0.4904, LEM: 0.2589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5844, partial_loss/deprel_loss: 0.8200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8669, loss: 0.9578, batch_reg_loss: 0.0941, reg_loss: 0.0930 ||:  86%|########6 | 96/111 [01:05<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8160, UAS: 0.9179, LAS: 0.8545, UEM: 0.4835, LEM: 0.2533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3356, partial_loss/deprel_loss: 1.2480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3597, loss: 0.9618, batch_reg_loss: 0.0942, reg_loss: 0.0931 ||:  90%|######### | 100/111 [01:08<00:07,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8480, UAS: 0.9185, LAS: 0.8549, UEM: 0.4847, LEM: 0.2529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8264, partial_loss/deprel_loss: 0.9697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0353, loss: 0.9581, batch_reg_loss: 0.0942, reg_loss: 0.0931 ||:  93%|#########2| 103/111 [01:10<00:05,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9190, LAS: 0.8556, UEM: 0.5012, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1585, partial_loss/deprel_loss: 0.3249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3859, loss: 0.9525, batch_reg_loss: 0.0943, reg_loss: 0.0931 ||:  95%|#########5| 106/111 [01:12<00:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8343, UAS: 0.9174, LAS: 0.8537, UEM: 0.4963, LEM: 0.2666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9702, partial_loss/deprel_loss: 0.9739, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0675, loss: 0.9691, batch_reg_loss: 0.0944, reg_loss: 0.0932 ||:  98%|#########8| 109/111 [01:14<00:01,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8448, UAS: 0.9175, LAS: 0.8538, UEM: 0.4941, LEM: 0.2641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9358, partial_loss/deprel_loss: 0.9596, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0492, loss: 0.9684, batch_reg_loss: 0.0944, reg_loss: 0.0932 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
+      "2023-04-06 23:17:24,438 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9379, LAS: 0.8819, UEM: 0.4929, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8324, partial_loss/deprel_loss: 30.4534, partial_loss/cycle_loss: 0.0000, batch_loss: 24.5292, loss: 22.6841, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9483, LAS: 0.8961, UEM: 0.7019, LEM: 0.4664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4225, partial_loss/deprel_loss: 25.9318, partial_loss/cycle_loss: 0.0000, batch_loss: 20.8300, loss: 21.0524, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:07,  1.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8710, UAS: 0.9460, LAS: 0.8899, UEM: 0.6444, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6182, partial_loss/deprel_loss: 33.9471, partial_loss/cycle_loss: 0.0000, batch_loss: 27.2813, loss: 21.9483, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9433, LAS: 0.8872, UEM: 0.6348, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1976, partial_loss/deprel_loss: 23.3129, partial_loss/cycle_loss: 0.0000, batch_loss: 18.6898, loss: 24.3207, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:09<00:01,  1.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9382, LAS: 0.8808, UEM: 0.6098, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5354, partial_loss/deprel_loss: 23.9953, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3033, loss: 25.6272, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00,  1.09it/s]\n",
+      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.960  |    23.995\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.936  |     0.535\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.093  |     0.000\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - UEM                      |     0.494  |     0.610\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - LAS                      |     0.854  |     0.881\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - loss                     |     0.968  |    25.627\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - LEM                      |     0.264  |     0.350\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - UAS                      |     0.918  |     0.938\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - EM                       |     0.845  |     0.885\n",
+      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:17:36,370 - INFO - combo.training.trainer - Epoch duration: 0:01:28.060274\n",
+      "2023-04-06 23:17:36,370 - INFO - combo.training.trainer - Estimated training time remaining: 8:22:02\n",
+      "2023-04-06 23:17:36,370 - INFO - allennlp.training.trainer - Epoch 21/399\n",
+      "2023-04-06 23:17:36,370 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:17:36,371 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:17:36,376 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8363, UAS: 0.9258, LAS: 0.8623, UEM: 0.3812, LEM: 0.1341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0052, partial_loss/deprel_loss: 0.9565, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0607, loss: 0.9069, batch_reg_loss: 0.0945, reg_loss: 0.0944 ||:   3%|2         | 3/111 [00:02<01:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9203, LAS: 0.8558, UEM: 0.3611, LEM: 0.1313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3760, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6596, loss: 0.9642, batch_reg_loss: 0.0946, reg_loss: 0.0945 ||:   6%|6         | 7/111 [00:04<01:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8580, UAS: 0.9250, LAS: 0.8613, UEM: 0.3832, LEM: 0.1313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8690, partial_loss/deprel_loss: 0.9013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9895, loss: 0.9139, batch_reg_loss: 0.0947, reg_loss: 0.0945 ||:  10%|9         | 11/111 [00:07<01:07,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8533, UAS: 0.9155, LAS: 0.8505, UEM: 0.3310, LEM: 0.1096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7844, partial_loss/deprel_loss: 0.8858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9602, loss: 0.9989, batch_reg_loss: 0.0947, reg_loss: 0.0946 ||:  14%|#3        | 15/111 [00:09<01:03,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8521, UAS: 0.9187, LAS: 0.8536, UEM: 0.3559, LEM: 0.1284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7069, partial_loss/deprel_loss: 0.9114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9654, loss: 0.9738, batch_reg_loss: 0.0948, reg_loss: 0.0946 ||:  17%|#7        | 19/111 [00:12<01:00,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8454, UAS: 0.9194, LAS: 0.8549, UEM: 0.3802, LEM: 0.1447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9340, partial_loss/deprel_loss: 0.8900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9937, loss: 0.9615, batch_reg_loss: 0.0949, reg_loss: 0.0947 ||:  21%|##        | 23/111 [00:14<00:56,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9213, LAS: 0.8573, UEM: 0.4043, LEM: 0.1632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3409, partial_loss/deprel_loss: 0.5584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6099, loss: 0.9402, batch_reg_loss: 0.0950, reg_loss: 0.0947 ||:  24%|##4       | 27/111 [00:17<00:52,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9229, LAS: 0.8593, UEM: 0.4209, LEM: 0.1772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3523, partial_loss/deprel_loss: 0.5628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6158, loss: 0.9247, batch_reg_loss: 0.0951, reg_loss: 0.0948 ||:  28%|##7       | 31/111 [00:19<00:51,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8642, UAS: 0.9226, LAS: 0.8594, UEM: 0.4405, LEM: 0.1987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7041, partial_loss/deprel_loss: 0.8753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9363, loss: 0.9259, batch_reg_loss: 0.0952, reg_loss: 0.0948 ||:  32%|###1      | 35/111 [00:22<00:48,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9234, LAS: 0.8603, UEM: 0.4429, LEM: 0.2005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9610, partial_loss/deprel_loss: 0.8971, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0052, loss: 0.9134, batch_reg_loss: 0.0953, reg_loss: 0.0949 ||:  35%|###5      | 39/111 [00:25<00:46,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7296, UAS: 0.9207, LAS: 0.8576, UEM: 0.4694, LEM: 0.2335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0297, partial_loss/deprel_loss: 1.8059, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1460, loss: 0.9392, batch_reg_loss: 0.0953, reg_loss: 0.0949 ||:  38%|###7      | 42/111 [00:27<00:46,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9230, LAS: 0.8604, UEM: 0.4986, LEM: 0.2542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4283, partial_loss/deprel_loss: 0.6117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6704, loss: 0.9153, batch_reg_loss: 0.0954, reg_loss: 0.0949 ||:  41%|####      | 45/111 [00:29<00:45,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8595, UAS: 0.9227, LAS: 0.8601, UEM: 0.4996, LEM: 0.2565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7368, partial_loss/deprel_loss: 0.8730, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9412, loss: 0.9158, batch_reg_loss: 0.0954, reg_loss: 0.0950 ||:  43%|####3     | 48/111 [00:31<00:45,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8347, UAS: 0.9213, LAS: 0.8584, UEM: 0.4874, LEM: 0.2479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9492, partial_loss/deprel_loss: 1.1123, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1752, loss: 0.9301, batch_reg_loss: 0.0955, reg_loss: 0.0950 ||:  46%|####5     | 51/111 [00:34<00:43,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9193, LAS: 0.8562, UEM: 0.4801, LEM: 0.2417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5844, partial_loss/deprel_loss: 0.7754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8328, loss: 0.9488, batch_reg_loss: 0.0956, reg_loss: 0.0950 ||:  49%|####8     | 54/111 [00:36<00:41,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9175, LAS: 0.8539, UEM: 0.4693, LEM: 0.2347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2272, partial_loss/deprel_loss: 1.2433, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3357, loss: 0.9674, batch_reg_loss: 0.0957, reg_loss: 0.0951 ||:  52%|#####2    | 58/111 [00:38<00:37,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9193, LAS: 0.8564, UEM: 0.5091, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1029, partial_loss/deprel_loss: 0.2265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2975, loss: 0.9466, batch_reg_loss: 0.0957, reg_loss: 0.0951 ||:  55%|#####4    | 61/111 [00:41<00:39,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.9187, LAS: 0.8552, UEM: 0.4985, LEM: 0.2708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6729, partial_loss/deprel_loss: 0.7973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8682, loss: 0.9533, batch_reg_loss: 0.0958, reg_loss: 0.0951 ||:  59%|#####8    | 65/111 [00:44<00:33,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8202, UAS: 0.9188, LAS: 0.8557, UEM: 0.4976, LEM: 0.2690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3849, partial_loss/deprel_loss: 1.1817, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3182, loss: 0.9503, batch_reg_loss: 0.0959, reg_loss: 0.0952 ||:  61%|######1   | 68/111 [00:46<00:30,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9184, LAS: 0.8552, UEM: 0.4954, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2846, partial_loss/deprel_loss: 0.4353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5012, loss: 0.9528, batch_reg_loss: 0.0960, reg_loss: 0.0952 ||:  65%|######4   | 72/111 [00:48<00:27,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9177, LAS: 0.8545, UEM: 0.4896, LEM: 0.2640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8338, partial_loss/deprel_loss: 0.8384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9335, loss: 0.9619, batch_reg_loss: 0.0961, reg_loss: 0.0953 ||:  68%|######8   | 76/111 [00:51<00:23,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8785, UAS: 0.9189, LAS: 0.8556, UEM: 0.4982, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3850, partial_loss/deprel_loss: 0.6036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6560, loss: 0.9503, batch_reg_loss: 0.0961, reg_loss: 0.0953 ||:  71%|#######1  | 79/111 [00:54<00:23,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7855, UAS: 0.9170, LAS: 0.8532, UEM: 0.4909, LEM: 0.2626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7202, partial_loss/deprel_loss: 1.4704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6166, loss: 0.9708, batch_reg_loss: 0.0962, reg_loss: 0.0953 ||:  74%|#######3  | 82/111 [00:56<00:20,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8386, UAS: 0.9167, LAS: 0.8527, UEM: 0.4814, LEM: 0.2560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9546, partial_loss/deprel_loss: 1.0401, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1193, loss: 0.9757, batch_reg_loss: 0.0963, reg_loss: 0.0954 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8799, UAS: 0.9178, LAS: 0.8541, UEM: 0.4946, LEM: 0.2651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4311, partial_loss/deprel_loss: 0.6831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7291, loss: 0.9636, batch_reg_loss: 0.0964, reg_loss: 0.0954 ||:  80%|########  | 89/111 [01:00<00:15,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8296, UAS: 0.9177, LAS: 0.8538, UEM: 0.4900, LEM: 0.2610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2122, partial_loss/deprel_loss: 1.0230, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1573, loss: 0.9669, batch_reg_loss: 0.0965, reg_loss: 0.0954 ||:  83%|########2 | 92/111 [01:02<00:13,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9174, LAS: 0.8535, UEM: 0.4914, LEM: 0.2603, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3006, partial_loss/deprel_loss: 0.5337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5836, loss: 0.9690, batch_reg_loss: 0.0965, reg_loss: 0.0955 ||:  86%|########5 | 95/111 [01:04<00:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9168, LAS: 0.8528, UEM: 0.4893, LEM: 0.2586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4066, partial_loss/deprel_loss: 0.6253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6781, loss: 0.9755, batch_reg_loss: 0.0966, reg_loss: 0.0955 ||:  88%|########8 | 98/111 [01:07<00:09,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8708, UAS: 0.9167, LAS: 0.8525, UEM: 0.4840, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6369, partial_loss/deprel_loss: 0.7295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8077, loss: 0.9770, batch_reg_loss: 0.0967, reg_loss: 0.0955 ||:  91%|######### | 101/111 [01:09<00:06,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8529, UAS: 0.9169, LAS: 0.8528, UEM: 0.4859, LEM: 0.2553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8818, partial_loss/deprel_loss: 0.8098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9210, loss: 0.9743, batch_reg_loss: 0.0968, reg_loss: 0.0956 ||:  95%|#########4| 105/111 [01:11<00:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8621, UAS: 0.9174, LAS: 0.8535, UEM: 0.4861, LEM: 0.2537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5777, partial_loss/deprel_loss: 0.8117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8617, loss: 0.9685, batch_reg_loss: 0.0968, reg_loss: 0.0956 ||:  97%|#########7| 108/111 [01:14<00:02,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8666, UAS: 0.9184, LAS: 0.8544, UEM: 0.4937, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6128, partial_loss/deprel_loss: 0.8212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8764, loss: 0.9610, batch_reg_loss: 0.0969, reg_loss: 0.0956 ||: 100%|##########| 111/111 [01:16<00:00,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8666, UAS: 0.9184, LAS: 0.8544, UEM: 0.4937, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6128, partial_loss/deprel_loss: 0.8212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8764, loss: 0.9610, batch_reg_loss: 0.0969, reg_loss: 0.0956 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.821  |       N/A\n",
+      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.613  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.096  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - UEM                      |     0.494  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - LAS                      |     0.854  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - loss                     |     0.961  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - LEM                      |     0.258  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - UAS                      |     0.918  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - EM                       |     0.867  |       N/A\n",
+      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:18:53,123 - INFO - combo.training.trainer - Epoch duration: 0:01:16.752609\n",
+      "2023-04-06 23:18:53,123 - INFO - combo.training.trainer - Estimated training time remaining: 8:19:56\n",
+      "2023-04-06 23:18:53,123 - INFO - allennlp.training.trainer - Epoch 22/399\n",
+      "2023-04-06 23:18:53,123 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:18:53,123 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:18:53,130 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9361, LAS: 0.8734, UEM: 0.4864, LEM: 0.2167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8275, partial_loss/deprel_loss: 0.8561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9474, loss: 0.8003, batch_reg_loss: 0.0970, reg_loss: 0.0970 ||:   4%|3         | 4/111 [00:02<00:57,  1.86it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8194, UAS: 0.9300, LAS: 0.8699, UEM: 0.5067, LEM: 0.2404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4623, partial_loss/deprel_loss: 1.1682, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3241, loss: 0.8539, batch_reg_loss: 0.0971, reg_loss: 0.0970 ||:   7%|7         | 8/111 [00:04<00:56,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9287, LAS: 0.8690, UEM: 0.4604, LEM: 0.2002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7500, partial_loss/deprel_loss: 0.8352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9153, loss: 0.8580, batch_reg_loss: 0.0971, reg_loss: 0.0970 ||:  11%|#         | 12/111 [00:06<00:56,  1.77it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9332, LAS: 0.8739, UEM: 0.5000, LEM: 0.2279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2665, partial_loss/deprel_loss: 0.4745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5301, loss: 0.8228, batch_reg_loss: 0.0972, reg_loss: 0.0971 ||:  14%|#3        | 15/111 [00:08<00:58,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9380, LAS: 0.8796, UEM: 0.5910, LEM: 0.3243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4276, partial_loss/deprel_loss: 0.6461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6996, loss: 0.7743, batch_reg_loss: 0.0973, reg_loss: 0.0971 ||:  16%|#6        | 18/111 [00:11<01:00,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8666, UAS: 0.9388, LAS: 0.8795, UEM: 0.5882, LEM: 0.3117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5401, partial_loss/deprel_loss: 0.7525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8074, loss: 0.7672, batch_reg_loss: 0.0973, reg_loss: 0.0971 ||:  19%|#8        | 21/111 [00:13<00:59,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9394, LAS: 0.8805, UEM: 0.5959, LEM: 0.3183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8269, partial_loss/deprel_loss: 0.9416, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0160, loss: 0.7596, batch_reg_loss: 0.0974, reg_loss: 0.0971 ||:  22%|##1       | 24/111 [00:15<00:58,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8729, UAS: 0.9385, LAS: 0.8795, UEM: 0.5779, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6153, partial_loss/deprel_loss: 0.8072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8663, loss: 0.7663, batch_reg_loss: 0.0974, reg_loss: 0.0972 ||:  24%|##4       | 27/111 [00:17<00:57,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9341, LAS: 0.8746, UEM: 0.5516, LEM: 0.2868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8354, partial_loss/deprel_loss: 1.2851, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4926, loss: 0.8122, batch_reg_loss: 0.0975, reg_loss: 0.0972 ||:  28%|##7       | 31/111 [00:20<00:53,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8138, UAS: 0.9303, LAS: 0.8703, UEM: 0.5369, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3798, partial_loss/deprel_loss: 1.2360, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3623, loss: 0.8503, batch_reg_loss: 0.0976, reg_loss: 0.0972 ||:  32%|###1      | 35/111 [00:22<00:51,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9314, LAS: 0.8718, UEM: 0.5791, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.5500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6164, loss: 0.8361, batch_reg_loss: 0.0976, reg_loss: 0.0973 ||:  34%|###4      | 38/111 [00:25<00:55,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8747, UAS: 0.9312, LAS: 0.8709, UEM: 0.5703, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5884, partial_loss/deprel_loss: 0.7088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7824, loss: 0.8412, batch_reg_loss: 0.0977, reg_loss: 0.0973 ||:  37%|###6      | 41/111 [00:27<00:52,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9275, LAS: 0.8665, UEM: 0.5581, LEM: 0.3114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6344, partial_loss/deprel_loss: 0.7415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8178, loss: 0.8770, batch_reg_loss: 0.0977, reg_loss: 0.0973 ||:  40%|###9      | 44/111 [00:29<00:48,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9283, LAS: 0.8671, UEM: 0.5570, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4666, partial_loss/deprel_loss: 0.6955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7476, loss: 0.8715, batch_reg_loss: 0.0978, reg_loss: 0.0974 ||:  43%|####3     | 48/111 [00:32<00:44,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9256, LAS: 0.8640, UEM: 0.5457, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4119, partial_loss/deprel_loss: 0.5915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6535, loss: 0.8893, batch_reg_loss: 0.0979, reg_loss: 0.0974 ||:  47%|####6     | 52/111 [00:35<00:40,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9268, LAS: 0.8653, UEM: 0.5666, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1844, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4296, loss: 0.8788, batch_reg_loss: 0.0980, reg_loss: 0.0974 ||:  50%|####9     | 55/111 [00:37<00:40,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9261, LAS: 0.8643, UEM: 0.5619, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3166, partial_loss/deprel_loss: 0.4570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5270, loss: 0.8857, batch_reg_loss: 0.0981, reg_loss: 0.0975 ||:  53%|#####3    | 59/111 [00:39<00:35,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7876, UAS: 0.9239, LAS: 0.8618, UEM: 0.5473, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7525, partial_loss/deprel_loss: 1.3168, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5021, loss: 0.9059, batch_reg_loss: 0.0982, reg_loss: 0.0975 ||:  57%|#####6    | 63/111 [00:42<00:32,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8164, UAS: 0.9234, LAS: 0.8610, UEM: 0.5373, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3867, partial_loss/deprel_loss: 1.1551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2997, loss: 0.9142, batch_reg_loss: 0.0982, reg_loss: 0.0976 ||:  59%|#####9    | 66/111 [00:44<00:30,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8013, UAS: 0.9236, LAS: 0.8612, UEM: 0.5420, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4252, partial_loss/deprel_loss: 1.3715, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4806, loss: 0.9127, batch_reg_loss: 0.0983, reg_loss: 0.0976 ||:  62%|######2   | 69/111 [00:47<00:30,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9236, LAS: 0.8613, UEM: 0.5379, LEM: 0.2975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5400, partial_loss/deprel_loss: 0.6561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7313, loss: 0.9139, batch_reg_loss: 0.0984, reg_loss: 0.0976 ||:  65%|######4   | 72/111 [00:49<00:28,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9226, LAS: 0.8598, UEM: 0.5300, LEM: 0.2902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5208, partial_loss/deprel_loss: 0.7197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7784, loss: 0.9243, batch_reg_loss: 0.0985, reg_loss: 0.0977 ||:  68%|######8   | 76/111 [00:51<00:24,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9214, LAS: 0.8586, UEM: 0.5237, LEM: 0.2858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7298, partial_loss/deprel_loss: 0.7075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8105, loss: 0.9339, batch_reg_loss: 0.0986, reg_loss: 0.0977 ||:  72%|#######2  | 80/111 [00:54<00:21,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9218, LAS: 0.8591, UEM: 0.5252, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5913, partial_loss/deprel_loss: 0.7371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8066, loss: 0.9308, batch_reg_loss: 0.0986, reg_loss: 0.0977 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9213, LAS: 0.8584, UEM: 0.5176, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4704, partial_loss/deprel_loss: 1.1766, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3341, loss: 0.9378, batch_reg_loss: 0.0987, reg_loss: 0.0978 ||:  78%|#######8  | 87/111 [00:59<00:16,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7587, UAS: 0.9197, LAS: 0.8566, UEM: 0.5081, LEM: 0.2734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3102, partial_loss/deprel_loss: 1.6186, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8557, loss: 0.9530, batch_reg_loss: 0.0988, reg_loss: 0.0978 ||:  82%|########1 | 91/111 [01:01<00:13,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8198, UAS: 0.9189, LAS: 0.8555, UEM: 0.4985, LEM: 0.2667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2651, partial_loss/deprel_loss: 1.0647, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2037, loss: 0.9623, batch_reg_loss: 0.0989, reg_loss: 0.0979 ||:  86%|########5 | 95/111 [01:04<00:10,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9190, LAS: 0.8555, UEM: 0.4983, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5153, partial_loss/deprel_loss: 0.7901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8342, loss: 0.9627, batch_reg_loss: 0.0990, reg_loss: 0.0979 ||:  89%|########9 | 99/111 [01:06<00:07,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9191, LAS: 0.8558, UEM: 0.5012, LEM: 0.2698, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5980, partial_loss/deprel_loss: 0.7163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7918, loss: 0.9603, batch_reg_loss: 0.0991, reg_loss: 0.0980 ||:  93%|#########2| 103/111 [01:09<00:05,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9187, LAS: 0.8553, UEM: 0.5018, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8508, partial_loss/deprel_loss: 0.9035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9922, loss: 0.9639, batch_reg_loss: 0.0992, reg_loss: 0.0980 ||:  96%|#########6| 107/111 [01:11<00:02,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9197, LAS: 0.8564, UEM: 0.5037, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4395, partial_loss/deprel_loss: 0.6932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7417, loss: 0.9546, batch_reg_loss: 0.0993, reg_loss: 0.0981 ||: 100%|##########| 111/111 [01:14<00:00,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9197, LAS: 0.8564, UEM: 0.5037, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4395, partial_loss/deprel_loss: 0.6932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7417, loss: 0.9546, batch_reg_loss: 0.0993, reg_loss: 0.0981 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
+      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.693  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.439  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.098  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - UEM                      |     0.504  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - LAS                      |     0.856  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - loss                     |     0.955  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - LEM                      |     0.269  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - UAS                      |     0.920  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - EM                       |     0.880  |       N/A\n",
+      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:20:07,333 - INFO - combo.training.trainer - Epoch duration: 0:01:14.210037\n",
+      "2023-04-06 23:20:07,333 - INFO - combo.training.trainer - Estimated training time remaining: 8:17:12\n",
+      "2023-04-06 23:20:07,333 - INFO - allennlp.training.trainer - Epoch 23/399\n",
+      "2023-04-06 23:20:07,333 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:20:07,334 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:20:07,340 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.8949, LAS: 0.8287, UEM: 0.1098, LEM: 0.0122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1080, partial_loss/deprel_loss: 1.0936, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1958, loss: 1.2573, batch_reg_loss: 0.0994, reg_loss: 0.0993 ||:   3%|2         | 3/111 [00:02<01:12,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9162, LAS: 0.8520, UEM: 0.4313, LEM: 0.1854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9910, partial_loss/deprel_loss: 0.9522, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0594, loss: 1.0167, batch_reg_loss: 0.0994, reg_loss: 0.0994 ||:   5%|5         | 6/111 [00:04<01:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9208, LAS: 0.8586, UEM: 0.4514, LEM: 0.1973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4497, partial_loss/deprel_loss: 0.7025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7515, loss: 0.9521, batch_reg_loss: 0.0995, reg_loss: 0.0994 ||:   9%|9         | 10/111 [00:06<01:06,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9220, LAS: 0.8594, UEM: 0.4382, LEM: 0.1919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5719, partial_loss/deprel_loss: 0.6911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7669, loss: 0.9378, batch_reg_loss: 0.0996, reg_loss: 0.0994 ||:  12%|#1        | 13/111 [00:08<01:05,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8195, UAS: 0.9152, LAS: 0.8517, UEM: 0.4119, LEM: 0.1816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4563, partial_loss/deprel_loss: 1.1203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2872, loss: 1.0058, batch_reg_loss: 0.0997, reg_loss: 0.0995 ||:  15%|#5        | 17/111 [00:11<01:02,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9212, LAS: 0.8597, UEM: 0.5133, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4697, partial_loss/deprel_loss: 0.6013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6747, loss: 0.9357, batch_reg_loss: 0.0997, reg_loss: 0.0995 ||:  18%|#8        | 20/111 [00:13<01:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7982, UAS: 0.9195, LAS: 0.8577, UEM: 0.4810, LEM: 0.2547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6368, partial_loss/deprel_loss: 1.2883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4579, loss: 0.9546, batch_reg_loss: 0.0998, reg_loss: 0.0996 ||:  22%|##1       | 24/111 [00:16<00:58,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9207, LAS: 0.8587, UEM: 0.4830, LEM: 0.2536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7993, partial_loss/deprel_loss: 0.8640, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9510, loss: 0.9487, batch_reg_loss: 0.0999, reg_loss: 0.0996 ||:  24%|##4       | 27/111 [00:18<00:57,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9174, LAS: 0.8551, UEM: 0.4849, LEM: 0.2546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2721, partial_loss/deprel_loss: 0.4954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5507, loss: 0.9817, batch_reg_loss: 0.1000, reg_loss: 0.0996 ||:  27%|##7       | 30/111 [00:20<00:56,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8186, UAS: 0.9170, LAS: 0.8551, UEM: 0.4742, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2339, partial_loss/deprel_loss: 1.1452, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2630, loss: 0.9804, batch_reg_loss: 0.1000, reg_loss: 0.0997 ||:  30%|##9       | 33/111 [00:22<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9191, LAS: 0.8576, UEM: 0.5179, LEM: 0.2871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1584, partial_loss/deprel_loss: 0.3758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4324, loss: 0.9551, batch_reg_loss: 0.1001, reg_loss: 0.0997 ||:  32%|###2      | 36/111 [00:24<00:52,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9208, LAS: 0.8592, UEM: 0.5176, LEM: 0.2831, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3242, partial_loss/deprel_loss: 0.5435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5999, loss: 0.9375, batch_reg_loss: 0.1002, reg_loss: 0.0998 ||:  36%|###6      | 40/111 [00:27<00:49,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9215, LAS: 0.8597, UEM: 0.5178, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4017, partial_loss/deprel_loss: 0.5735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6394, loss: 0.9290, batch_reg_loss: 0.1003, reg_loss: 0.0998 ||:  39%|###8      | 43/111 [00:29<00:47,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9230, LAS: 0.8616, UEM: 0.5530, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0951, partial_loss/deprel_loss: 0.2286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3023, loss: 0.9164, batch_reg_loss: 0.1003, reg_loss: 0.0998 ||:  41%|####1     | 46/111 [00:31<00:48,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9233, LAS: 0.8621, UEM: 0.5553, LEM: 0.3236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4974, partial_loss/deprel_loss: 0.6754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7402, loss: 0.9117, batch_reg_loss: 0.1004, reg_loss: 0.0999 ||:  44%|####4     | 49/111 [00:34<00:45,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8017, UAS: 0.9220, LAS: 0.8608, UEM: 0.5543, LEM: 0.3267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5379, partial_loss/deprel_loss: 1.2708, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4247, loss: 0.9204, batch_reg_loss: 0.1005, reg_loss: 0.0999 ||:  48%|####7     | 53/111 [00:36<00:41,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9218, LAS: 0.8605, UEM: 0.5487, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3058, partial_loss/deprel_loss: 0.5159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5744, loss: 0.9219, batch_reg_loss: 0.1005, reg_loss: 0.0999 ||:  50%|#####     | 56/111 [00:38<00:39,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9142, UAS: 0.9226, LAS: 0.8614, UEM: 0.5549, LEM: 0.3237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1668, partial_loss/deprel_loss: 0.4572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4997, loss: 0.9170, batch_reg_loss: 0.1006, reg_loss: 0.1000 ||:  53%|#####3    | 59/111 [00:41<00:38,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9232, LAS: 0.8619, UEM: 0.5563, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5530, partial_loss/deprel_loss: 0.6772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7530, loss: 0.9111, batch_reg_loss: 0.1007, reg_loss: 0.1000 ||:  56%|#####5    | 62/111 [00:43<00:36,  1.34it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9238, LAS: 0.8623, UEM: 0.5494, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4779, partial_loss/deprel_loss: 0.8325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8623, loss: 0.9075, batch_reg_loss: 0.1008, reg_loss: 0.1000 ||:  59%|#####9    | 66/111 [00:46<00:32,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9234, LAS: 0.8620, UEM: 0.5454, LEM: 0.3091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9666, partial_loss/deprel_loss: 0.9580, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0606, loss: 0.9100, batch_reg_loss: 0.1008, reg_loss: 0.1001 ||:  62%|######2   | 69/111 [00:48<00:29,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9209, LAS: 0.8594, UEM: 0.5390, LEM: 0.3046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5884, partial_loss/deprel_loss: 0.8047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8623, loss: 0.9318, batch_reg_loss: 0.1009, reg_loss: 0.1001 ||:  65%|######4   | 72/111 [00:50<00:27,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.9218, LAS: 0.8603, UEM: 0.5415, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6952, partial_loss/deprel_loss: 0.8219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8975, loss: 0.9227, batch_reg_loss: 0.1009, reg_loss: 0.1001 ||:  68%|######7   | 75/111 [00:52<00:26,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8815, UAS: 0.9209, LAS: 0.8591, UEM: 0.5355, LEM: 0.2978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5396, partial_loss/deprel_loss: 0.6414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7220, loss: 0.9309, batch_reg_loss: 0.1010, reg_loss: 0.1002 ||:  71%|#######1  | 79/111 [00:55<00:23,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9214, LAS: 0.8597, UEM: 0.5347, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3550, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6287, loss: 0.9262, batch_reg_loss: 0.1011, reg_loss: 0.1002 ||:  74%|#######3  | 82/111 [00:57<00:20,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9216, LAS: 0.8599, UEM: 0.5292, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1648, partial_loss/deprel_loss: 1.1497, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2539, loss: 0.9257, batch_reg_loss: 0.1012, reg_loss: 0.1003 ||:  77%|#######7  | 86/111 [00:59<00:16,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8274, UAS: 0.9212, LAS: 0.8595, UEM: 0.5286, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1797, partial_loss/deprel_loss: 1.0297, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1609, loss: 0.9283, batch_reg_loss: 0.1013, reg_loss: 0.1003 ||:  80%|########  | 89/111 [01:02<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9205, LAS: 0.8586, UEM: 0.5206, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8560, partial_loss/deprel_loss: 0.8923, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9864, loss: 0.9342, batch_reg_loss: 0.1013, reg_loss: 0.1003 ||:  83%|########2 | 92/111 [01:04<00:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8405, UAS: 0.9196, LAS: 0.8574, UEM: 0.5135, LEM: 0.2820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8253, partial_loss/deprel_loss: 0.8840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9737, loss: 0.9429, batch_reg_loss: 0.1014, reg_loss: 0.1004 ||:  86%|########5 | 95/111 [01:06<00:11,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8775, UAS: 0.9202, LAS: 0.8579, UEM: 0.5121, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4252, partial_loss/deprel_loss: 0.6383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6971, loss: 0.9379, batch_reg_loss: 0.1015, reg_loss: 0.1004 ||:  88%|########8 | 98/111 [01:08<00:09,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9202, LAS: 0.8578, UEM: 0.5151, LEM: 0.2800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3950, partial_loss/deprel_loss: 0.6499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7004, loss: 0.9367, batch_reg_loss: 0.1015, reg_loss: 0.1004 ||:  91%|######### | 101/111 [01:10<00:07,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9204, LAS: 0.8580, UEM: 0.5113, LEM: 0.2761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5823, partial_loss/deprel_loss: 0.7403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8103, loss: 0.9358, batch_reg_loss: 0.1016, reg_loss: 0.1005 ||:  94%|#########3| 104/111 [01:13<00:05,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9201, LAS: 0.8575, UEM: 0.5075, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3702, partial_loss/deprel_loss: 1.1280, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2781, loss: 0.9388, batch_reg_loss: 0.1017, reg_loss: 0.1005 ||:  96%|#########6| 107/111 [01:15<00:02,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9199, LAS: 0.8573, UEM: 0.5026, LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.7012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7733, loss: 0.9416, batch_reg_loss: 0.1018, reg_loss: 0.1005 ||: 100%|##########| 111/111 [01:17<00:00,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9199, LAS: 0.8573, UEM: 0.5026, LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.7012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7733, loss: 0.9416, batch_reg_loss: 0.1018, reg_loss: 0.1005 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
+      "2023-04-06 23:21:25,103 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:21:25,103 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:21:25,103 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.701  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.553  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.101  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - UEM                      |     0.503  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - LAS                      |     0.857  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - loss                     |     0.942  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - LEM                      |     0.268  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - UAS                      |     0.920  |       N/A\n",
+      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:21:25,105 - INFO - combo.training.tensorboard_writer - EM                       |     0.879  |       N/A\n",
+      "2023-04-06 23:21:25,105 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:21:25,105 - INFO - combo.training.trainer - Epoch duration: 0:01:17.771978\n",
+      "2023-04-06 23:21:25,105 - INFO - combo.training.trainer - Estimated training time remaining: 8:15:32\n",
+      "2023-04-06 23:21:25,105 - INFO - allennlp.training.trainer - Epoch 24/399\n",
+      "2023-04-06 23:21:25,106 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:21:25,106 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:21:25,112 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9498, LAS: 0.8965, UEM: 0.6134, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4244, partial_loss/deprel_loss: 0.5337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6136, loss: 0.6403, batch_reg_loss: 0.1018, reg_loss: 0.1018 ||:   3%|2         | 3/111 [00:02<01:13,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7832, UAS: 0.9222, LAS: 0.8663, UEM: 0.5378, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0726, partial_loss/deprel_loss: 1.2622, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5262, loss: 0.8804, batch_reg_loss: 0.1019, reg_loss: 0.1018 ||:   5%|5         | 6/111 [00:04<01:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9254, LAS: 0.8696, UEM: 0.5613, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2665, partial_loss/deprel_loss: 0.4438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5103, loss: 0.8574, batch_reg_loss: 0.1020, reg_loss: 0.1019 ||:   8%|8         | 9/111 [00:06<01:13,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9290, LAS: 0.8697, UEM: 0.5375, LEM: 0.2582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5027, partial_loss/deprel_loss: 0.7213, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7796, loss: 0.8491, batch_reg_loss: 0.1021, reg_loss: 0.1019 ||:  12%|#1        | 13/111 [00:08<01:05,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8115, UAS: 0.9180, LAS: 0.8568, UEM: 0.4769, LEM: 0.2268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3171, partial_loss/deprel_loss: 1.1869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3151, loss: 0.9530, batch_reg_loss: 0.1021, reg_loss: 0.1020 ||:  15%|#5        | 17/111 [00:11<01:01,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9202, LAS: 0.8585, UEM: 0.4617, LEM: 0.2124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5182, partial_loss/deprel_loss: 0.6378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7161, loss: 0.9386, batch_reg_loss: 0.1022, reg_loss: 0.1020 ||:  19%|#8        | 21/111 [00:13<00:57,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8729, UAS: 0.9191, LAS: 0.8573, UEM: 0.4431, LEM: 0.1985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5818, partial_loss/deprel_loss: 0.7437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8136, loss: 0.9558, batch_reg_loss: 0.1023, reg_loss: 0.1020 ||:  22%|##1       | 24/111 [00:15<00:57,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9207, LAS: 0.8589, UEM: 0.4550, LEM: 0.2127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7988, partial_loss/deprel_loss: 0.9206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9986, loss: 0.9407, batch_reg_loss: 0.1024, reg_loss: 0.1021 ||:  25%|##5       | 28/111 [00:18<00:54,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9219, LAS: 0.8599, UEM: 0.4545, LEM: 0.2086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9907, partial_loss/deprel_loss: 0.9659, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0733, loss: 0.9309, batch_reg_loss: 0.1025, reg_loss: 0.1021 ||:  28%|##7       | 31/111 [00:20<00:53,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8286, UAS: 0.9239, LAS: 0.8630, UEM: 0.5199, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1700, partial_loss/deprel_loss: 1.1138, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2275, loss: 0.9088, batch_reg_loss: 0.1025, reg_loss: 0.1022 ||:  31%|###       | 34/111 [00:22<00:55,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9237, LAS: 0.8628, UEM: 0.5208, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3895, partial_loss/deprel_loss: 0.6072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.9085, batch_reg_loss: 0.1026, reg_loss: 0.1022 ||:  34%|###4      | 38/111 [00:25<00:50,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8645, UAS: 0.9219, LAS: 0.8612, UEM: 0.5116, LEM: 0.2786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6607, partial_loss/deprel_loss: 0.7658, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8475, loss: 0.9216, batch_reg_loss: 0.1027, reg_loss: 0.1022 ||:  38%|###7      | 42/111 [00:27<00:45,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7785, UAS: 0.9207, LAS: 0.8600, UEM: 0.5061, LEM: 0.2746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8828, partial_loss/deprel_loss: 1.4185, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6141, loss: 0.9324, batch_reg_loss: 0.1028, reg_loss: 0.1023 ||:  41%|####1     | 46/111 [00:30<00:42,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9206, LAS: 0.8598, UEM: 0.4985, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5178, partial_loss/deprel_loss: 1.2824, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4323, loss: 0.9363, batch_reg_loss: 0.1028, reg_loss: 0.1023 ||:  45%|####5     | 50/111 [00:33<00:40,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9225, LAS: 0.8620, UEM: 0.5273, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3015, partial_loss/deprel_loss: 0.4830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5496, loss: 0.9186, batch_reg_loss: 0.1029, reg_loss: 0.1024 ||:  48%|####7     | 53/111 [00:35<00:39,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8645, UAS: 0.9225, LAS: 0.8617, UEM: 0.5194, LEM: 0.2878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6157, partial_loss/deprel_loss: 0.7654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8384, loss: 0.9208, batch_reg_loss: 0.1030, reg_loss: 0.1024 ||:  50%|#####     | 56/111 [00:37<00:37,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9223, LAS: 0.8611, UEM: 0.5155, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3731, partial_loss/deprel_loss: 0.6492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6971, loss: 0.9261, batch_reg_loss: 0.1030, reg_loss: 0.1024 ||:  53%|#####3    | 59/111 [00:39<00:36,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9211, LAS: 0.8598, UEM: 0.5063, LEM: 0.2758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7221, partial_loss/deprel_loss: 0.8030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8899, loss: 0.9367, batch_reg_loss: 0.1031, reg_loss: 0.1025 ||:  56%|#####5    | 62/111 [00:41<00:33,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8357, UAS: 0.9183, LAS: 0.8566, UEM: 0.4943, LEM: 0.2676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0037, partial_loss/deprel_loss: 0.9773, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0858, loss: 0.9632, batch_reg_loss: 0.1032, reg_loss: 0.1025 ||:  59%|#####9    | 66/111 [00:44<00:30,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8227, UAS: 0.9178, LAS: 0.8557, UEM: 0.4850, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1411, partial_loss/deprel_loss: 1.1626, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2616, loss: 0.9685, batch_reg_loss: 0.1033, reg_loss: 0.1025 ||:  63%|######3   | 70/111 [00:46<00:27,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9048, UAS: 0.9189, LAS: 0.8569, UEM: 0.4977, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2746, partial_loss/deprel_loss: 0.5005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5587, loss: 0.9568, batch_reg_loss: 0.1034, reg_loss: 0.1026 ||:  67%|######6   | 74/111 [00:49<00:24,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8208, UAS: 0.9177, LAS: 0.8557, UEM: 0.4966, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6101, partial_loss/deprel_loss: 1.1479, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3438, loss: 0.9684, batch_reg_loss: 0.1035, reg_loss: 0.1026 ||:  69%|######9   | 77/111 [00:51<00:23,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9174, LAS: 0.8554, UEM: 0.4877, LEM: 0.2624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6921, partial_loss/deprel_loss: 0.7516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8433, loss: 0.9711, batch_reg_loss: 0.1036, reg_loss: 0.1027 ||:  73%|#######2  | 81/111 [00:54<00:20,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9177, LAS: 0.8554, UEM: 0.4819, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5465, partial_loss/deprel_loss: 0.7612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8219, loss: 0.9704, batch_reg_loss: 0.1036, reg_loss: 0.1027 ||:  77%|#######6  | 85/111 [00:56<00:16,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9183, LAS: 0.8559, UEM: 0.4814, LEM: 0.2532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6801, partial_loss/deprel_loss: 0.8225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8978, loss: 0.9660, batch_reg_loss: 0.1037, reg_loss: 0.1028 ||:  80%|########  | 89/111 [00:59<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9192, LAS: 0.8571, UEM: 0.4872, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5869, partial_loss/deprel_loss: 0.6416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7345, loss: 0.9550, batch_reg_loss: 0.1038, reg_loss: 0.1028 ||:  84%|########3 | 93/111 [01:01<00:11,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9200, LAS: 0.8581, UEM: 0.4941, LEM: 0.2628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2738, partial_loss/deprel_loss: 0.4538, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5217, loss: 0.9464, batch_reg_loss: 0.1039, reg_loss: 0.1028 ||:  87%|########7 | 97/111 [01:05<00:09,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9204, LAS: 0.8585, UEM: 0.5007, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4079, partial_loss/deprel_loss: 0.5752, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6458, loss: 0.9437, batch_reg_loss: 0.1040, reg_loss: 0.1029 ||:  91%|######### | 101/111 [01:07<00:07,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9208, LAS: 0.8587, UEM: 0.5012, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3307, partial_loss/deprel_loss: 0.5607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6188, loss: 0.9398, batch_reg_loss: 0.1041, reg_loss: 0.1029 ||:  94%|#########3| 104/111 [01:10<00:04,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9209, LAS: 0.8588, UEM: 0.4988, LEM: 0.2634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5770, partial_loss/deprel_loss: 0.6887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7704, loss: 0.9390, batch_reg_loss: 0.1041, reg_loss: 0.1030 ||:  96%|#########6| 107/111 [01:12<00:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7959, UAS: 0.9205, LAS: 0.8584, UEM: 0.5038, LEM: 0.2702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6188, partial_loss/deprel_loss: 1.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5033, loss: 0.9428, batch_reg_loss: 0.1042, reg_loss: 0.1030 ||:  99%|#########9| 110/111 [01:14<00:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9208, LAS: 0.8587, UEM: 0.5047, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3658, partial_loss/deprel_loss: 0.5668, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6308, loss: 0.9400, batch_reg_loss: 0.1042, reg_loss: 0.1030 ||: 100%|##########| 111/111 [01:15<00:00,  1.48it/s]\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.567  |       N/A\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.366  |       N/A\n",
+      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.103  |       N/A\n",
+      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - UEM                      |     0.505  |       N/A\n",
+      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - LAS                      |     0.859  |       N/A\n",
+      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - loss                     |     0.940  |       N/A\n",
+      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - LEM                      |     0.270  |       N/A\n",
+      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - UAS                      |     0.921  |       N/A\n",
+      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - EM                       |     0.892  |       N/A\n",
+      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:22:40,314 - INFO - combo.training.trainer - Epoch duration: 0:01:15.208139\n",
+      "2023-04-06 23:22:40,314 - INFO - combo.training.trainer - Estimated training time remaining: 8:13:15\n",
+      "2023-04-06 23:22:40,314 - INFO - allennlp.training.trainer - Epoch 25/399\n",
+      "2023-04-06 23:22:40,314 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:22:40,314 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:22:40,320 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9344, LAS: 0.8797, UEM: 0.4935, LEM: 0.2495, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6547, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8849, loss: 0.7391, batch_reg_loss: 0.1042, reg_loss: 0.1042 ||:   3%|2         | 3/111 [00:02<01:15,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8283, UAS: 0.9349, LAS: 0.8766, UEM: 0.4955, LEM: 0.2317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0891, partial_loss/deprel_loss: 1.0617, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1715, loss: 0.7907, batch_reg_loss: 0.1043, reg_loss: 0.1043 ||:   5%|5         | 6/111 [00:04<01:13,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8172, UAS: 0.9163, LAS: 0.8558, UEM: 0.4640, LEM: 0.2246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3905, partial_loss/deprel_loss: 1.1573, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3083, loss: 0.9494, batch_reg_loss: 0.1044, reg_loss: 0.1043 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9227, LAS: 0.8621, UEM: 0.4577, LEM: 0.2099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4299, partial_loss/deprel_loss: 0.6033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6731, loss: 0.9065, batch_reg_loss: 0.1045, reg_loss: 0.1043 ||:  13%|#2        | 14/111 [00:09<01:05,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9247, LAS: 0.8645, UEM: 0.4702, LEM: 0.2253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6388, partial_loss/deprel_loss: 0.7764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8534, loss: 0.8863, batch_reg_loss: 0.1045, reg_loss: 0.1044 ||:  15%|#5        | 17/111 [00:11<01:07,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9276, LAS: 0.8682, UEM: 0.5241, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8834, partial_loss/deprel_loss: 0.9625, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0513, loss: 0.8611, batch_reg_loss: 0.1046, reg_loss: 0.1044 ||:  18%|#8        | 20/111 [00:14<01:05,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8113, UAS: 0.9243, LAS: 0.8644, UEM: 0.4944, LEM: 0.2741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5374, partial_loss/deprel_loss: 1.1203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3084, loss: 0.8922, batch_reg_loss: 0.1047, reg_loss: 0.1044 ||:  21%|##        | 23/111 [00:16<01:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9286, LAS: 0.8690, UEM: 0.5379, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3213, partial_loss/deprel_loss: 0.5448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.8552, batch_reg_loss: 0.1047, reg_loss: 0.1045 ||:  23%|##3       | 26/111 [00:18<01:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7784, UAS: 0.9271, LAS: 0.8676, UEM: 0.5357, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1583, partial_loss/deprel_loss: 1.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6182, loss: 0.8713, batch_reg_loss: 0.1048, reg_loss: 0.1045 ||:  27%|##7       | 30/111 [00:20<00:55,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9281, LAS: 0.8688, UEM: 0.5477, LEM: 0.3002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3166, partial_loss/deprel_loss: 0.4624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5381, loss: 0.8613, batch_reg_loss: 0.1049, reg_loss: 0.1045 ||:  30%|##9       | 33/111 [00:22<00:53,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8912, UAS: 0.9289, LAS: 0.8693, UEM: 0.5395, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3442, partial_loss/deprel_loss: 0.6002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6539, loss: 0.8581, batch_reg_loss: 0.1049, reg_loss: 0.1046 ||:  32%|###2      | 36/111 [00:24<00:51,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8346, UAS: 0.9285, LAS: 0.8688, UEM: 0.5242, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1629, partial_loss/deprel_loss: 1.0839, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2047, loss: 0.8636, batch_reg_loss: 0.1050, reg_loss: 0.1046 ||:  36%|###6      | 40/111 [00:27<00:47,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7681, UAS: 0.9278, LAS: 0.8681, UEM: 0.5437, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1504, partial_loss/deprel_loss: 1.4375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6852, loss: 0.8681, batch_reg_loss: 0.1051, reg_loss: 0.1046 ||:  39%|###8      | 43/111 [00:29<00:48,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9259, LAS: 0.8659, UEM: 0.5305, LEM: 0.2850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6785, partial_loss/deprel_loss: 0.7163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8139, loss: 0.8856, batch_reg_loss: 0.1052, reg_loss: 0.1047 ||:  42%|####2     | 47/111 [00:32<00:43,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8641, UAS: 0.9249, LAS: 0.8648, UEM: 0.5189, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6368, partial_loss/deprel_loss: 0.7374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8225, loss: 0.8922, batch_reg_loss: 0.1052, reg_loss: 0.1047 ||:  45%|####5     | 50/111 [00:34<00:42,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9257, LAS: 0.8655, UEM: 0.5205, LEM: 0.2743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3766, partial_loss/deprel_loss: 0.6185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6754, loss: 0.8873, batch_reg_loss: 0.1053, reg_loss: 0.1047 ||:  48%|####7     | 53/111 [00:36<00:40,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9251, LAS: 0.8652, UEM: 0.5197, LEM: 0.2753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2680, partial_loss/deprel_loss: 0.4119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.8925, batch_reg_loss: 0.1054, reg_loss: 0.1048 ||:  50%|#####     | 56/111 [00:38<00:38,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9268, LAS: 0.8674, UEM: 0.5477, LEM: 0.3105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4947, partial_loss/deprel_loss: 0.7372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7941, loss: 0.8777, batch_reg_loss: 0.1054, reg_loss: 0.1048 ||:  53%|#####3    | 59/111 [00:41<00:39,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8073, UAS: 0.9261, LAS: 0.8666, UEM: 0.5477, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6483, partial_loss/deprel_loss: 1.1254, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3354, loss: 0.8834, batch_reg_loss: 0.1055, reg_loss: 0.1048 ||:  56%|#####5    | 62/111 [00:43<00:36,  1.33it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9259, LAS: 0.8663, UEM: 0.5460, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3969, partial_loss/deprel_loss: 0.5212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6019, loss: 0.8849, batch_reg_loss: 0.1056, reg_loss: 0.1049 ||:  59%|#####9    | 66/111 [00:46<00:32,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8236, UAS: 0.9236, LAS: 0.8636, UEM: 0.5365, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2846, partial_loss/deprel_loss: 1.1375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2725, loss: 0.9055, batch_reg_loss: 0.1056, reg_loss: 0.1049 ||:  62%|######2   | 69/111 [00:48<00:30,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8148, UAS: 0.9225, LAS: 0.8623, UEM: 0.5268, LEM: 0.2954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3223, partial_loss/deprel_loss: 1.2582, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3767, loss: 0.9208, batch_reg_loss: 0.1057, reg_loss: 0.1050 ||:  65%|######4   | 72/111 [00:50<00:27,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7637, UAS: 0.9220, LAS: 0.8616, UEM: 0.5317, LEM: 0.3009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9413, partial_loss/deprel_loss: 1.3939, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6091, loss: 0.9239, batch_reg_loss: 0.1058, reg_loss: 0.1050 ||:  68%|######7   | 75/111 [00:52<00:25,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9222, LAS: 0.8616, UEM: 0.5255, LEM: 0.2946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7652, partial_loss/deprel_loss: 0.8632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9495, loss: 0.9231, batch_reg_loss: 0.1058, reg_loss: 0.1050 ||:  70%|#######   | 78/111 [00:54<00:23,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9232, LAS: 0.8625, UEM: 0.5251, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4565, partial_loss/deprel_loss: 0.7356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7857, loss: 0.9174, batch_reg_loss: 0.1059, reg_loss: 0.1050 ||:  73%|#######2  | 81/111 [00:56<00:21,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9231, LAS: 0.8623, UEM: 0.5156, LEM: 0.2836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0232, partial_loss/deprel_loss: 1.1543, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2341, loss: 0.9186, batch_reg_loss: 0.1060, reg_loss: 0.1051 ||:  77%|#######6  | 85/111 [00:59<00:17,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9238, LAS: 0.8630, UEM: 0.5193, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2800, partial_loss/deprel_loss: 0.5071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5677, loss: 0.9128, batch_reg_loss: 0.1061, reg_loss: 0.1051 ||:  80%|########  | 89/111 [01:01<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9241, LAS: 0.8633, UEM: 0.5179, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0860, partial_loss/deprel_loss: 1.0809, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1880, loss: 0.9103, batch_reg_loss: 0.1062, reg_loss: 0.1052 ||:  83%|########2 | 92/111 [01:04<00:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8234, UAS: 0.9244, LAS: 0.8636, UEM: 0.5232, LEM: 0.2852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2385, partial_loss/deprel_loss: 1.0176, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1680, loss: 0.9053, batch_reg_loss: 0.1062, reg_loss: 0.1052 ||:  86%|########6 | 96/111 [01:06<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9233, LAS: 0.8623, UEM: 0.5169, LEM: 0.2813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8967, partial_loss/deprel_loss: 0.9467, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0430, loss: 0.9148, batch_reg_loss: 0.1063, reg_loss: 0.1052 ||:  89%|########9 | 99/111 [01:08<00:08,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9238, LAS: 0.8630, UEM: 0.5188, LEM: 0.2829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3748, partial_loss/deprel_loss: 0.5105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5897, loss: 0.9090, batch_reg_loss: 0.1064, reg_loss: 0.1053 ||:  92%|#########1| 102/111 [01:11<00:06,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9231, LAS: 0.8623, UEM: 0.5110, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7957, partial_loss/deprel_loss: 0.8864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9747, loss: 0.9154, batch_reg_loss: 0.1064, reg_loss: 0.1053 ||:  95%|#########5| 106/111 [01:14<00:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7423, UAS: 0.9219, LAS: 0.8609, UEM: 0.5056, LEM: 0.2734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8168, partial_loss/deprel_loss: 1.8275, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1319, loss: 0.9278, batch_reg_loss: 0.1065, reg_loss: 0.1054 ||:  99%|#########9| 110/111 [01:16<00:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9221, LAS: 0.8612, UEM: 0.5086, LEM: 0.2752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3234, partial_loss/deprel_loss: 0.5511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6121, loss: 0.9250, batch_reg_loss: 0.1065, reg_loss: 0.1054 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
+      "2023-04-06 23:23:58,213 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9630, LAS: 0.9177, UEM: 0.8159, LEM: 0.5815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1737, partial_loss/deprel_loss: 20.5474, partial_loss/cycle_loss: 0.0000, batch_loss: 16.4726, loss: 21.0144, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9472, LAS: 0.8955, UEM: 0.7141, LEM: 0.4812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0153, partial_loss/deprel_loss: 43.3811, partial_loss/cycle_loss: 0.0000, batch_loss: 34.9080, loss: 25.5731, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:07,  1.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9444, LAS: 0.8901, UEM: 0.6600, LEM: 0.4105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7415, partial_loss/deprel_loss: 29.8373, partial_loss/cycle_loss: 0.0000, batch_loss: 24.0182, loss: 24.7509, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9442, LAS: 0.8901, UEM: 0.6403, LEM: 0.3835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3994, partial_loss/deprel_loss: 17.6347, partial_loss/cycle_loss: 0.0000, batch_loss: 14.1877, loss: 24.6526, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.06it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9410, LAS: 0.8860, UEM: 0.6232, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3976, partial_loss/deprel_loss: 24.4861, partial_loss/cycle_loss: 0.0000, batch_loss: 19.6684, loss: 25.9867, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.06it/s]\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.551  |    24.486\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.323  |     0.398\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.105  |     0.000\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - UEM                      |     0.509  |     0.623\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - LAS                      |     0.861  |     0.886\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - loss                     |     0.925  |    25.987\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - LEM                      |     0.275  |     0.362\n",
+      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - UAS                      |     0.922  |     0.941\n",
+      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - EM                       |     0.893  |     0.904\n",
+      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:24:10,535 - INFO - combo.training.trainer - Epoch duration: 0:01:30.221589\n",
+      "2023-04-06 23:24:10,535 - INFO - combo.training.trainer - Estimated training time remaining: 8:14:38\n",
+      "2023-04-06 23:24:10,536 - INFO - allennlp.training.trainer - Epoch 26/399\n",
+      "2023-04-06 23:24:10,536 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:24:10,536 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:24:10,542 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9545, LAS: 0.9014, UEM: 0.6867, LEM: 0.3821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3364, partial_loss/deprel_loss: 0.5464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.6380, batch_reg_loss: 0.1066, reg_loss: 0.1066 ||:   3%|2         | 3/111 [00:02<01:20,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8532, UAS: 0.9292, LAS: 0.8709, UEM: 0.5445, LEM: 0.2801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7835, partial_loss/deprel_loss: 0.8604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9517, loss: 0.8619, batch_reg_loss: 0.1067, reg_loss: 0.1066 ||:   6%|6         | 7/111 [00:04<01:14,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9296, LAS: 0.8722, UEM: 0.6059, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1357, partial_loss/deprel_loss: 0.2700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3499, loss: 0.8487, batch_reg_loss: 0.1068, reg_loss: 0.1067 ||:   9%|9         | 10/111 [00:07<01:14,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8605, UAS: 0.9257, LAS: 0.8661, UEM: 0.5670, LEM: 0.3431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8304, partial_loss/deprel_loss: 0.8325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9389, loss: 0.8925, batch_reg_loss: 0.1068, reg_loss: 0.1067 ||:  13%|#2        | 14/111 [00:09<01:07,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9232, LAS: 0.8619, UEM: 0.5243, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5089, partial_loss/deprel_loss: 0.7516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8100, loss: 0.9244, batch_reg_loss: 0.1069, reg_loss: 0.1068 ||:  16%|#6        | 18/111 [00:11<01:01,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8921, UAS: 0.9243, LAS: 0.8631, UEM: 0.5139, LEM: 0.2889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3767, partial_loss/deprel_loss: 0.5236, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.9069, batch_reg_loss: 0.1070, reg_loss: 0.1068 ||:  19%|#8        | 21/111 [00:14<01:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9241, LAS: 0.8641, UEM: 0.5164, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2933, partial_loss/deprel_loss: 0.4944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5612, loss: 0.9046, batch_reg_loss: 0.1071, reg_loss: 0.1068 ||:  23%|##2       | 25/111 [00:16<00:57,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9258, LAS: 0.8660, UEM: 0.5084, LEM: 0.2739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4166, partial_loss/deprel_loss: 0.6166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6837, loss: 0.8859, batch_reg_loss: 0.1072, reg_loss: 0.1069 ||:  26%|##6       | 29/111 [00:19<00:55,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9258, LAS: 0.8655, UEM: 0.5043, LEM: 0.2665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2740, partial_loss/deprel_loss: 0.5245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5816, loss: 0.8904, batch_reg_loss: 0.1073, reg_loss: 0.1069 ||:  30%|##9       | 33/111 [00:21<00:51,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9282, LAS: 0.8682, UEM: 0.5457, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1732, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4990, loss: 0.8672, batch_reg_loss: 0.1073, reg_loss: 0.1069 ||:  32%|###2      | 36/111 [00:23<00:49,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9276, LAS: 0.8675, UEM: 0.5649, LEM: 0.3241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3104, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5757, loss: 0.8686, batch_reg_loss: 0.1074, reg_loss: 0.1070 ||:  35%|###5      | 39/111 [00:26<00:48,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9282, LAS: 0.8683, UEM: 0.5682, LEM: 0.3254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2328, partial_loss/deprel_loss: 0.4289, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4971, loss: 0.8663, batch_reg_loss: 0.1075, reg_loss: 0.1070 ||:  39%|###8      | 43/111 [00:28<00:44,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9305, LAS: 0.8712, UEM: 0.5994, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3668, partial_loss/deprel_loss: 0.6581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7074, loss: 0.8445, batch_reg_loss: 0.1075, reg_loss: 0.1071 ||:  42%|####2     | 47/111 [00:31<00:42,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8464, UAS: 0.9285, LAS: 0.8689, UEM: 0.5846, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8792, partial_loss/deprel_loss: 0.9102, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0116, loss: 0.8637, batch_reg_loss: 0.1076, reg_loss: 0.1071 ||:  46%|####5     | 51/111 [00:33<00:39,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9282, LAS: 0.8684, UEM: 0.5741, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4152, partial_loss/deprel_loss: 0.6219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6883, loss: 0.8696, batch_reg_loss: 0.1077, reg_loss: 0.1071 ||:  50%|####9     | 55/111 [00:36<00:36,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9289, LAS: 0.8689, UEM: 0.5806, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3748, partial_loss/deprel_loss: 0.6606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7112, loss: 0.8649, batch_reg_loss: 0.1078, reg_loss: 0.1072 ||:  53%|#####3    | 59/111 [00:39<00:35,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8305, UAS: 0.9287, LAS: 0.8687, UEM: 0.5776, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1911, partial_loss/deprel_loss: 1.0662, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1991, loss: 0.8640, batch_reg_loss: 0.1078, reg_loss: 0.1072 ||:  56%|#####5    | 62/111 [00:41<00:34,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9283, LAS: 0.8684, UEM: 0.5685, LEM: 0.3305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0422, partial_loss/deprel_loss: 0.9557, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0810, loss: 0.8660, batch_reg_loss: 0.1079, reg_loss: 0.1073 ||:  59%|#####9    | 66/111 [00:43<00:30,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9273, LAS: 0.8673, UEM: 0.5602, LEM: 0.3234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4067, partial_loss/deprel_loss: 0.6749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7293, loss: 0.8741, batch_reg_loss: 0.1080, reg_loss: 0.1073 ||:  63%|######3   | 70/111 [00:46<00:27,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9263, LAS: 0.8659, UEM: 0.5479, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7849, partial_loss/deprel_loss: 0.7782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8876, loss: 0.8835, batch_reg_loss: 0.1081, reg_loss: 0.1073 ||:  67%|######6   | 74/111 [00:48<00:23,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9263, LAS: 0.8660, UEM: 0.5435, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8610, partial_loss/deprel_loss: 0.9041, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0036, loss: 0.8832, batch_reg_loss: 0.1082, reg_loss: 0.1074 ||:  70%|#######   | 78/111 [00:51<00:21,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9239, LAS: 0.8632, UEM: 0.5339, LEM: 0.3026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0083, partial_loss/deprel_loss: 0.9057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0345, loss: 0.9074, batch_reg_loss: 0.1083, reg_loss: 0.1074 ||:  74%|#######3  | 82/111 [00:54<00:19,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9232, LAS: 0.8625, UEM: 0.5256, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4858, partial_loss/deprel_loss: 0.6129, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6958, loss: 0.9146, batch_reg_loss: 0.1083, reg_loss: 0.1075 ||:  77%|#######7  | 86/111 [00:57<00:16,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8379, UAS: 0.9209, LAS: 0.8601, UEM: 0.5163, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1256, partial_loss/deprel_loss: 0.9807, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1181, loss: 0.9341, batch_reg_loss: 0.1084, reg_loss: 0.1075 ||:  81%|########1 | 90/111 [00:59<00:14,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9218, LAS: 0.8611, UEM: 0.5218, LEM: 0.2919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3100, partial_loss/deprel_loss: 0.5110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5793, loss: 0.9257, batch_reg_loss: 0.1085, reg_loss: 0.1075 ||:  84%|########3 | 93/111 [01:02<00:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8807, UAS: 0.9222, LAS: 0.8613, UEM: 0.5183, LEM: 0.2878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5588, partial_loss/deprel_loss: 0.6559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7451, loss: 0.9237, batch_reg_loss: 0.1086, reg_loss: 0.1076 ||:  86%|########6 | 96/111 [01:04<00:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8350, UAS: 0.9224, LAS: 0.8615, UEM: 0.5172, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0468, partial_loss/deprel_loss: 1.0077, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1242, loss: 0.9211, batch_reg_loss: 0.1087, reg_loss: 0.1076 ||:  90%|######### | 100/111 [01:06<00:07,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9214, LAS: 0.8605, UEM: 0.5132, LEM: 0.2837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4873, partial_loss/deprel_loss: 0.6853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7544, loss: 0.9311, batch_reg_loss: 0.1087, reg_loss: 0.1076 ||:  93%|#########2| 103/111 [01:08<00:05,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9221, LAS: 0.8612, UEM: 0.5180, LEM: 0.2852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7112, partial_loss/deprel_loss: 0.8132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9016, loss: 0.9247, batch_reg_loss: 0.1088, reg_loss: 0.1077 ||:  95%|#########5| 106/111 [01:11<00:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9214, LAS: 0.8602, UEM: 0.5101, LEM: 0.2792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2259, partial_loss/deprel_loss: 1.2003, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3143, loss: 0.9326, batch_reg_loss: 0.1089, reg_loss: 0.1077 ||:  99%|#########9| 110/111 [01:13<00:00,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9217, LAS: 0.8605, UEM: 0.5109, LEM: 0.2788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3606, partial_loss/deprel_loss: 0.6149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6730, loss: 0.9302, batch_reg_loss: 0.1089, reg_loss: 0.1077 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
+      "2023-04-06 23:25:25,100 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.615  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.361  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.108  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - UEM                      |     0.511  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - LAS                      |     0.861  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - loss                     |     0.930  |       N/A\n",
+      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - LEM                      |     0.279  |       N/A\n",
+      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - UAS                      |     0.922  |       N/A\n",
+      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - EM                       |     0.898  |       N/A\n",
+      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:25:25,102 - INFO - combo.training.trainer - Epoch duration: 0:01:14.566974\n",
+      "2023-04-06 23:25:25,103 - INFO - combo.training.trainer - Estimated training time remaining: 8:12:13\n",
+      "2023-04-06 23:25:25,103 - INFO - allennlp.training.trainer - Epoch 27/399\n",
+      "2023-04-06 23:25:25,103 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:25:25,103 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:25:25,110 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8523, UAS: 0.9369, LAS: 0.8747, UEM: 0.5058, LEM: 0.2442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8675, partial_loss/deprel_loss: 1.0086, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0894, loss: 0.8187, batch_reg_loss: 0.1090, reg_loss: 0.1090 ||:   4%|3         | 4/111 [00:02<01:07,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9336, LAS: 0.8740, UEM: 0.5125, LEM: 0.2599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3637, partial_loss/deprel_loss: 0.5490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6210, loss: 0.8310, batch_reg_loss: 0.1091, reg_loss: 0.1090 ||:   7%|7         | 8/111 [00:05<01:06,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8245, UAS: 0.9243, LAS: 0.8646, UEM: 0.5087, LEM: 0.2633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3445, partial_loss/deprel_loss: 1.1262, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2790, loss: 0.9138, batch_reg_loss: 0.1091, reg_loss: 0.1090 ||:  10%|9         | 11/111 [00:07<01:06,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8379, UAS: 0.9269, LAS: 0.8667, UEM: 0.5467, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8799, partial_loss/deprel_loss: 1.0002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0854, loss: 0.8886, batch_reg_loss: 0.1092, reg_loss: 0.1091 ||:  13%|#2        | 14/111 [00:09<01:05,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9294, LAS: 0.8700, UEM: 0.5552, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3805, partial_loss/deprel_loss: 0.5957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6619, loss: 0.8598, batch_reg_loss: 0.1093, reg_loss: 0.1091 ||:  15%|#5        | 17/111 [00:11<01:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9265, LAS: 0.8674, UEM: 0.5617, LEM: 0.3090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5139, loss: 0.8870, batch_reg_loss: 0.1093, reg_loss: 0.1091 ||:  19%|#8        | 21/111 [00:14<01:01,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8317, UAS: 0.9271, LAS: 0.8678, UEM: 0.5447, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1042, partial_loss/deprel_loss: 0.9767, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1116, loss: 0.8804, batch_reg_loss: 0.1094, reg_loss: 0.1092 ||:  23%|##2       | 25/111 [00:16<00:55,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9287, LAS: 0.8691, UEM: 0.5503, LEM: 0.3007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5186, partial_loss/deprel_loss: 0.7539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8163, loss: 0.8661, batch_reg_loss: 0.1095, reg_loss: 0.1092 ||:  26%|##6       | 29/111 [00:19<00:52,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9292, LAS: 0.8690, UEM: 0.5347, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6542, partial_loss/deprel_loss: 0.8093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8878, loss: 0.8647, batch_reg_loss: 0.1096, reg_loss: 0.1093 ||:  30%|##9       | 33/111 [00:21<00:49,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7760, UAS: 0.9264, LAS: 0.8662, UEM: 0.5149, LEM: 0.2670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9272, partial_loss/deprel_loss: 1.4164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6282, loss: 0.8847, batch_reg_loss: 0.1097, reg_loss: 0.1093 ||:  33%|###3      | 37/111 [00:24<00:46,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9237, LAS: 0.8637, UEM: 0.5148, LEM: 0.2693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4669, partial_loss/deprel_loss: 1.0744, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2626, loss: 0.9017, batch_reg_loss: 0.1097, reg_loss: 0.1093 ||:  37%|###6      | 41/111 [00:27<00:47,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9233, LAS: 0.8630, UEM: 0.5048, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5881, partial_loss/deprel_loss: 0.7383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8181, loss: 0.9055, batch_reg_loss: 0.1098, reg_loss: 0.1094 ||:  41%|####      | 45/111 [00:29<00:43,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9229, LAS: 0.8620, UEM: 0.4906, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1077, partial_loss/deprel_loss: 1.0868, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2009, loss: 0.9135, batch_reg_loss: 0.1099, reg_loss: 0.1094 ||:  44%|####4     | 49/111 [00:32<00:42,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8291, UAS: 0.9227, LAS: 0.8618, UEM: 0.4889, LEM: 0.2509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1882, partial_loss/deprel_loss: 1.1634, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2784, loss: 0.9169, batch_reg_loss: 0.1100, reg_loss: 0.1095 ||:  48%|####7     | 53/111 [00:35<00:38,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9214, LAS: 0.8604, UEM: 0.5006, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1371, partial_loss/deprel_loss: 0.2988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3766, loss: 0.9293, batch_reg_loss: 0.1101, reg_loss: 0.1095 ||:  51%|#####1    | 57/111 [00:37<00:35,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8270, UAS: 0.9216, LAS: 0.8607, UEM: 0.4967, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3575, partial_loss/deprel_loss: 1.1842, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3291, loss: 0.9275, batch_reg_loss: 0.1102, reg_loss: 0.1095 ||:  55%|#####4    | 61/111 [00:40<00:33,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9224, LAS: 0.8614, UEM: 0.4990, LEM: 0.2618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3941, partial_loss/deprel_loss: 0.6425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7031, loss: 0.9222, batch_reg_loss: 0.1103, reg_loss: 0.1096 ||:  59%|#####8    | 65/111 [00:43<00:31,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9221, LAS: 0.8608, UEM: 0.4882, LEM: 0.2540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5820, partial_loss/deprel_loss: 0.7200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8027, loss: 0.9284, batch_reg_loss: 0.1104, reg_loss: 0.1096 ||:  62%|######2   | 69/111 [00:45<00:27,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7939, UAS: 0.9217, LAS: 0.8602, UEM: 0.4867, LEM: 0.2522, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4043, partial_loss/deprel_loss: 1.2781, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4138, loss: 0.9343, batch_reg_loss: 0.1105, reg_loss: 0.1097 ||:  66%|######5   | 73/111 [00:48<00:25,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9218, LAS: 0.8604, UEM: 0.4876, LEM: 0.2539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1732, partial_loss/deprel_loss: 1.1097, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2329, loss: 0.9349, batch_reg_loss: 0.1105, reg_loss: 0.1097 ||:  68%|######8   | 76/111 [00:50<00:23,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7630, UAS: 0.9204, LAS: 0.8589, UEM: 0.4799, LEM: 0.2490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3397, partial_loss/deprel_loss: 1.4709, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7552, loss: 0.9468, batch_reg_loss: 0.1106, reg_loss: 0.1098 ||:  72%|#######2  | 80/111 [00:53<00:20,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9212, LAS: 0.8595, UEM: 0.4774, LEM: 0.2459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4129, partial_loss/deprel_loss: 0.5541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6366, loss: 0.9420, batch_reg_loss: 0.1107, reg_loss: 0.1098 ||:  76%|#######5  | 84/111 [00:55<00:17,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9211, LAS: 0.8593, UEM: 0.4725, LEM: 0.2413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4724, partial_loss/deprel_loss: 0.6431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7198, loss: 0.9422, batch_reg_loss: 0.1108, reg_loss: 0.1098 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9214, LAS: 0.8598, UEM: 0.4746, LEM: 0.2414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3605, partial_loss/deprel_loss: 0.5323, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6088, loss: 0.9386, batch_reg_loss: 0.1109, reg_loss: 0.1099 ||:  83%|########2 | 92/111 [01:00<00:12,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9217, LAS: 0.8601, UEM: 0.4750, LEM: 0.2411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2847, partial_loss/deprel_loss: 0.5046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5715, loss: 0.9359, batch_reg_loss: 0.1109, reg_loss: 0.1099 ||:  86%|########6 | 96/111 [01:03<00:09,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9220, LAS: 0.8605, UEM: 0.4788, LEM: 0.2450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5046, loss: 0.9335, batch_reg_loss: 0.1110, reg_loss: 0.1100 ||:  90%|######### | 100/111 [01:05<00:07,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9226, LAS: 0.8612, UEM: 0.4877, LEM: 0.2515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1806, partial_loss/deprel_loss: 0.4301, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4913, loss: 0.9288, batch_reg_loss: 0.1111, reg_loss: 0.1100 ||:  94%|#########3| 104/111 [01:08<00:04,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9225, LAS: 0.8610, UEM: 0.4866, LEM: 0.2516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6775, partial_loss/deprel_loss: 0.9319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9922, loss: 0.9303, batch_reg_loss: 0.1112, reg_loss: 0.1101 ||:  97%|#########7| 108/111 [01:11<00:02,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9236, LAS: 0.8623, UEM: 0.5071, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0673, partial_loss/deprel_loss: 0.2098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2925, loss: 0.9200, batch_reg_loss: 0.1112, reg_loss: 0.1101 ||: 100%|##########| 111/111 [01:14<00:00,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9236, LAS: 0.8623, UEM: 0.5071, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0673, partial_loss/deprel_loss: 0.2098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2925, loss: 0.9200, batch_reg_loss: 0.1112, reg_loss: 0.1101 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
+      "2023-04-06 23:26:39,190 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:26:39,190 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:26:39,190 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.210  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.067  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.110  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - UEM                      |     0.507  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - LAS                      |     0.862  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - loss                     |     0.920  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - LEM                      |     0.275  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - UAS                      |     0.924  |       N/A\n",
+      "2023-04-06 23:26:39,192 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:26:39,192 - INFO - combo.training.tensorboard_writer - EM                       |     0.949  |       N/A\n",
+      "2023-04-06 23:26:39,192 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:26:39,192 - INFO - combo.training.trainer - Epoch duration: 0:01:14.089580\n",
+      "2023-04-06 23:26:39,192 - INFO - combo.training.trainer - Estimated training time remaining: 8:09:46\n",
+      "2023-04-06 23:26:39,192 - INFO - allennlp.training.trainer - Epoch 28/399\n",
+      "2023-04-06 23:26:39,193 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:26:39,193 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:26:39,200 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9165, LAS: 0.8582, UEM: 0.6021, LEM: 0.3938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2068, partial_loss/deprel_loss: 0.4027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4748, loss: 0.9632, batch_reg_loss: 0.1113, reg_loss: 0.1113 ||:   3%|2         | 3/111 [00:02<01:20,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8479, UAS: 0.9296, LAS: 0.8705, UEM: 0.5821, LEM: 0.3469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8214, partial_loss/deprel_loss: 1.0063, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0807, loss: 0.8797, batch_reg_loss: 0.1114, reg_loss: 0.1113 ||:   5%|5         | 6/111 [00:04<01:16,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9309, LAS: 0.8722, UEM: 0.5280, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8053, partial_loss/deprel_loss: 0.8538, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9555, loss: 0.8659, batch_reg_loss: 0.1114, reg_loss: 0.1113 ||:   8%|8         | 9/111 [00:06<01:14,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9298, LAS: 0.8711, UEM: 0.5151, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4062, partial_loss/deprel_loss: 0.5566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6380, loss: 0.8682, batch_reg_loss: 0.1115, reg_loss: 0.1114 ||:  12%|#1        | 13/111 [00:09<01:09,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9512, UAS: 0.9341, LAS: 0.8772, UEM: 0.6051, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0950, partial_loss/deprel_loss: 0.1922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2843, loss: 0.8222, batch_reg_loss: 0.1115, reg_loss: 0.1114 ||:  14%|#4        | 16/111 [00:11<01:08,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9353, LAS: 0.8781, UEM: 0.5912, LEM: 0.3662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3400, partial_loss/deprel_loss: 0.5233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5982, loss: 0.8082, batch_reg_loss: 0.1116, reg_loss: 0.1114 ||:  17%|#7        | 19/111 [00:13<01:06,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9338, LAS: 0.8764, UEM: 0.5584, LEM: 0.3338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8651, partial_loss/deprel_loss: 0.8871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9944, loss: 0.8188, batch_reg_loss: 0.1117, reg_loss: 0.1115 ||:  21%|##        | 23/111 [00:16<01:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9357, LAS: 0.8784, UEM: 0.5772, LEM: 0.3459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1911, partial_loss/deprel_loss: 0.4073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4758, loss: 0.7985, batch_reg_loss: 0.1117, reg_loss: 0.1115 ||:  23%|##3       | 26/111 [00:18<01:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9333, LAS: 0.8759, UEM: 0.5707, LEM: 0.3427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0747, partial_loss/deprel_loss: 0.9027, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0489, loss: 0.8142, batch_reg_loss: 0.1118, reg_loss: 0.1115 ||:  26%|##6       | 29/111 [00:20<00:58,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8281, UAS: 0.9316, LAS: 0.8740, UEM: 0.5647, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2179, partial_loss/deprel_loss: 1.0295, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1790, loss: 0.8310, batch_reg_loss: 0.1118, reg_loss: 0.1116 ||:  29%|##8       | 32/111 [00:22<00:58,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9268, LAS: 0.8688, UEM: 0.5456, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0683, partial_loss/deprel_loss: 0.9735, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1044, loss: 0.8689, batch_reg_loss: 0.1119, reg_loss: 0.1116 ||:  32%|###1      | 35/111 [00:25<00:56,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9256, LAS: 0.8672, UEM: 0.5327, LEM: 0.3104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3730, partial_loss/deprel_loss: 0.5946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6623, loss: 0.8821, batch_reg_loss: 0.1120, reg_loss: 0.1116 ||:  35%|###5      | 39/111 [00:27<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9262, LAS: 0.8679, UEM: 0.5237, LEM: 0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4640, partial_loss/deprel_loss: 0.6099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6928, loss: 0.8753, batch_reg_loss: 0.1121, reg_loss: 0.1117 ||:  39%|###8      | 43/111 [00:30<00:46,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8842, UAS: 0.9260, LAS: 0.8675, UEM: 0.5286, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5349, partial_loss/deprel_loss: 0.5833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6858, loss: 0.8760, batch_reg_loss: 0.1122, reg_loss: 0.1117 ||:  42%|####2     | 47/111 [00:32<00:42,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.9248, LAS: 0.8660, UEM: 0.5233, LEM: 0.2962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2239, partial_loss/deprel_loss: 1.0366, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1863, loss: 0.8865, batch_reg_loss: 0.1123, reg_loss: 0.1117 ||:  46%|####5     | 51/111 [00:35<00:40,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9241, LAS: 0.8651, UEM: 0.5362, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4257, partial_loss/deprel_loss: 0.6319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7030, loss: 0.8954, batch_reg_loss: 0.1123, reg_loss: 0.1118 ||:  49%|####8     | 54/111 [00:37<00:40,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9245, LAS: 0.8652, UEM: 0.5354, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3021, partial_loss/deprel_loss: 0.5010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5736, loss: 0.8952, batch_reg_loss: 0.1124, reg_loss: 0.1118 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9239, LAS: 0.8643, UEM: 0.5229, LEM: 0.2924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0378, partial_loss/deprel_loss: 1.0526, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1621, loss: 0.9046, batch_reg_loss: 0.1125, reg_loss: 0.1118 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8561, UAS: 0.9243, LAS: 0.8646, UEM: 0.5144, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8400, partial_loss/deprel_loss: 0.8978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9988, loss: 0.9017, batch_reg_loss: 0.1125, reg_loss: 0.1119 ||:  58%|#####7    | 64/111 [00:44<00:31,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9241, LAS: 0.8643, UEM: 0.5133, LEM: 0.2813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3304, partial_loss/deprel_loss: 0.5270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6003, loss: 0.9049, batch_reg_loss: 0.1126, reg_loss: 0.1119 ||:  61%|######1   | 68/111 [00:47<00:29,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9236, LAS: 0.8637, UEM: 0.5139, LEM: 0.2831, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3526, partial_loss/deprel_loss: 0.4551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5473, loss: 0.9107, batch_reg_loss: 0.1127, reg_loss: 0.1120 ||:  64%|######3   | 71/111 [00:49<00:27,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8335, UAS: 0.9230, LAS: 0.8629, UEM: 0.5046, LEM: 0.2758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1078, partial_loss/deprel_loss: 1.0005, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1347, loss: 0.9176, batch_reg_loss: 0.1128, reg_loss: 0.1120 ||:  68%|######7   | 75/111 [00:51<00:23,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9228, LAS: 0.8627, UEM: 0.5046, LEM: 0.2741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3583, partial_loss/deprel_loss: 0.5200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6006, loss: 0.9189, batch_reg_loss: 0.1129, reg_loss: 0.1120 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9231, LAS: 0.8629, UEM: 0.4983, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7399, partial_loss/deprel_loss: 0.8801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9650, loss: 0.9165, batch_reg_loss: 0.1130, reg_loss: 0.1121 ||:  75%|#######4  | 83/111 [00:56<00:17,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9215, LAS: 0.8608, UEM: 0.4888, LEM: 0.2624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8571, partial_loss/deprel_loss: 0.8282, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9470, loss: 0.9335, batch_reg_loss: 0.1131, reg_loss: 0.1121 ||:  78%|#######8  | 87/111 [00:59<00:15,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9220, LAS: 0.8617, UEM: 0.4992, LEM: 0.2722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3817, partial_loss/deprel_loss: 0.4937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5845, loss: 0.9263, batch_reg_loss: 0.1131, reg_loss: 0.1122 ||:  82%|########1 | 91/111 [01:02<00:13,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9226, LAS: 0.8625, UEM: 0.5122, LEM: 0.2863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7510, partial_loss/deprel_loss: 0.7480, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8618, loss: 0.9195, batch_reg_loss: 0.1132, reg_loss: 0.1122 ||:  86%|########5 | 95/111 [01:04<00:10,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9221, LAS: 0.8619, UEM: 0.5084, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4955, partial_loss/deprel_loss: 0.6987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7713, loss: 0.9258, batch_reg_loss: 0.1133, reg_loss: 0.1122 ||:  88%|########8 | 98/111 [01:07<00:08,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9228, LAS: 0.8628, UEM: 0.5095, LEM: 0.2814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4700, partial_loss/deprel_loss: 0.6280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7098, loss: 0.9194, batch_reg_loss: 0.1134, reg_loss: 0.1123 ||:  91%|######### | 101/111 [01:09<00:07,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9230, LAS: 0.8630, UEM: 0.5087, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.6215, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6894, loss: 0.9173, batch_reg_loss: 0.1134, reg_loss: 0.1123 ||:  94%|#########3| 104/111 [01:11<00:05,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9233, LAS: 0.8633, UEM: 0.5091, LEM: 0.2789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6688, partial_loss/deprel_loss: 0.7718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8647, loss: 0.9148, batch_reg_loss: 0.1135, reg_loss: 0.1123 ||:  96%|#########6| 107/111 [01:13<00:02,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8285, UAS: 0.9229, LAS: 0.8628, UEM: 0.5057, LEM: 0.2769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1495, partial_loss/deprel_loss: 1.0547, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1872, loss: 0.9196, batch_reg_loss: 0.1136, reg_loss: 0.1124 ||: 100%|##########| 111/111 [01:16<00:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8285, UAS: 0.9229, LAS: 0.8628, UEM: 0.5057, LEM: 0.2769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1495, partial_loss/deprel_loss: 1.0547, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1872, loss: 0.9196, batch_reg_loss: 0.1136, reg_loss: 0.1124 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.055  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.150  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.112  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - UEM                      |     0.506  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - LAS                      |     0.863  |       N/A\n",
+      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - loss                     |     0.920  |       N/A\n",
+      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - LEM                      |     0.277  |       N/A\n",
+      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - UAS                      |     0.923  |       N/A\n",
+      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - EM                       |     0.829  |       N/A\n",
+      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:27:55,560 - INFO - combo.training.trainer - Epoch duration: 0:01:16.367015\n",
+      "2023-04-06 23:27:55,560 - INFO - combo.training.trainer - Estimated training time remaining: 8:07:53\n",
+      "2023-04-06 23:27:55,560 - INFO - allennlp.training.trainer - Epoch 29/399\n",
+      "2023-04-06 23:27:55,560 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:27:55,560 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:27:55,567 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9484, LAS: 0.8952, UEM: 0.6497, LEM: 0.3616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3046, partial_loss/deprel_loss: 0.4306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5190, loss: 0.6486, batch_reg_loss: 0.1136, reg_loss: 0.1136 ||:   3%|2         | 3/111 [00:02<01:22,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8304, UAS: 0.9318, LAS: 0.8774, UEM: 0.5448, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2572, partial_loss/deprel_loss: 1.0995, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2447, loss: 0.8080, batch_reg_loss: 0.1137, reg_loss: 0.1136 ||:   5%|5         | 6/111 [00:04<01:20,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.9304, LAS: 0.8744, UEM: 0.4970, LEM: 0.2492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9037, partial_loss/deprel_loss: 0.8621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9842, loss: 0.8255, batch_reg_loss: 0.1138, reg_loss: 0.1137 ||:   8%|8         | 9/111 [00:06<01:16,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8404, UAS: 0.9234, LAS: 0.8670, UEM: 0.5124, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1069, partial_loss/deprel_loss: 1.0057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1398, loss: 0.8843, batch_reg_loss: 0.1138, reg_loss: 0.1137 ||:  11%|#         | 12/111 [00:09<01:14,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9279, LAS: 0.8722, UEM: 0.5277, LEM: 0.2683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5707, partial_loss/deprel_loss: 0.5580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6744, loss: 0.8422, batch_reg_loss: 0.1139, reg_loss: 0.1137 ||:  14%|#3        | 15/111 [00:11<01:10,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9297, LAS: 0.8731, UEM: 0.5152, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8735, partial_loss/deprel_loss: 0.9656, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0611, loss: 0.8408, batch_reg_loss: 0.1139, reg_loss: 0.1138 ||:  16%|#6        | 18/111 [00:13<01:07,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8382, UAS: 0.9254, LAS: 0.8680, UEM: 0.4779, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1899, partial_loss/deprel_loss: 0.9413, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.8777, batch_reg_loss: 0.1140, reg_loss: 0.1138 ||:  20%|#9        | 22/111 [00:15<01:00,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9271, LAS: 0.8695, UEM: 0.4928, LEM: 0.2473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1706, partial_loss/deprel_loss: 0.4245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.8677, batch_reg_loss: 0.1141, reg_loss: 0.1138 ||:  23%|##3       | 26/111 [00:18<00:56,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9297, LAS: 0.8723, UEM: 0.5254, LEM: 0.2732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3101, partial_loss/deprel_loss: 0.5013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5773, loss: 0.8417, batch_reg_loss: 0.1142, reg_loss: 0.1139 ||:  26%|##6       | 29/111 [00:20<00:57,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9264, LAS: 0.8679, UEM: 0.4938, LEM: 0.2548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9940, partial_loss/deprel_loss: 0.9541, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0763, loss: 0.8794, batch_reg_loss: 0.1143, reg_loss: 0.1139 ||:  30%|##9       | 33/111 [00:22<00:52,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9259, LAS: 0.8670, UEM: 0.4878, LEM: 0.2516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3425, partial_loss/deprel_loss: 0.5836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6497, loss: 0.8870, batch_reg_loss: 0.1143, reg_loss: 0.1140 ||:  32%|###2      | 36/111 [00:25<00:51,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8347, UAS: 0.9254, LAS: 0.8666, UEM: 0.4828, LEM: 0.2487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2760, partial_loss/deprel_loss: 1.0077, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1758, loss: 0.8918, batch_reg_loss: 0.1144, reg_loss: 0.1140 ||:  35%|###5      | 39/111 [00:27<00:50,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9239, LAS: 0.8647, UEM: 0.4670, LEM: 0.2391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2418, partial_loss/deprel_loss: 0.9941, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1581, loss: 0.9075, batch_reg_loss: 0.1144, reg_loss: 0.1140 ||:  38%|###7      | 42/111 [00:29<00:48,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9235, LAS: 0.8640, UEM: 0.4682, LEM: 0.2383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3704, partial_loss/deprel_loss: 0.5971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.9136, batch_reg_loss: 0.1145, reg_loss: 0.1140 ||:  41%|####      | 45/111 [00:31<00:47,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9244, LAS: 0.8653, UEM: 0.4755, LEM: 0.2426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0601, partial_loss/deprel_loss: 1.0311, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1515, loss: 0.9071, batch_reg_loss: 0.1146, reg_loss: 0.1141 ||:  43%|####3     | 48/111 [00:34<00:48,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9235, LAS: 0.8643, UEM: 0.4635, LEM: 0.2325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5594, partial_loss/deprel_loss: 1.1760, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3673, loss: 0.9154, batch_reg_loss: 0.1147, reg_loss: 0.1141 ||:  47%|####6     | 52/111 [00:36<00:42,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8303, UAS: 0.9236, LAS: 0.8641, UEM: 0.4612, LEM: 0.2281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1919, partial_loss/deprel_loss: 1.0681, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2076, loss: 0.9156, batch_reg_loss: 0.1147, reg_loss: 0.1142 ||:  50%|####9     | 55/111 [00:38<00:40,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9229, LAS: 0.8635, UEM: 0.4512, LEM: 0.2224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7935, partial_loss/deprel_loss: 0.7807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8981, loss: 0.9207, batch_reg_loss: 0.1148, reg_loss: 0.1142 ||:  53%|#####3    | 59/111 [00:41<00:36,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8556, UAS: 0.9232, LAS: 0.8639, UEM: 0.4533, LEM: 0.2245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7478, partial_loss/deprel_loss: 0.9507, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0250, loss: 0.9175, batch_reg_loss: 0.1149, reg_loss: 0.1142 ||:  57%|#####6    | 63/111 [00:44<00:32,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9243, LAS: 0.8649, UEM: 0.4697, LEM: 0.2379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2051, partial_loss/deprel_loss: 0.3932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4706, loss: 0.9061, batch_reg_loss: 0.1150, reg_loss: 0.1143 ||:  60%|######    | 67/111 [00:46<00:30,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9244, LAS: 0.8650, UEM: 0.4710, LEM: 0.2382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3257, partial_loss/deprel_loss: 0.4715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5574, loss: 0.9044, batch_reg_loss: 0.1151, reg_loss: 0.1143 ||:  64%|######3   | 71/111 [00:49<00:26,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9256, LAS: 0.8662, UEM: 0.4812, LEM: 0.2444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3156, partial_loss/deprel_loss: 0.4371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5280, loss: 0.8951, batch_reg_loss: 0.1151, reg_loss: 0.1144 ||:  68%|######7   | 75/111 [00:52<00:24,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9258, LAS: 0.8662, UEM: 0.4778, LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0733, partial_loss/deprel_loss: 1.0164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1430, loss: 0.8939, batch_reg_loss: 0.1152, reg_loss: 0.1144 ||:  71%|#######1  | 79/111 [00:54<00:20,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9250, LAS: 0.8653, UEM: 0.4695, LEM: 0.2337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6336, partial_loss/deprel_loss: 0.7658, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8547, loss: 0.9007, batch_reg_loss: 0.1153, reg_loss: 0.1144 ||:  75%|#######4  | 83/111 [00:57<00:18,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.9255, LAS: 0.8657, UEM: 0.4783, LEM: 0.2420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0986, partial_loss/deprel_loss: 1.0203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1513, loss: 0.8969, batch_reg_loss: 0.1154, reg_loss: 0.1145 ||:  78%|#######8  | 87/111 [00:59<00:15,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9263, LAS: 0.8668, UEM: 0.4890, LEM: 0.2493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6777, partial_loss/deprel_loss: 0.7179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8253, loss: 0.8871, batch_reg_loss: 0.1154, reg_loss: 0.1145 ||:  82%|########1 | 91/111 [01:02<00:13,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7511, UAS: 0.9233, LAS: 0.8634, UEM: 0.4815, LEM: 0.2455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6230, partial_loss/deprel_loss: 1.7261, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0210, loss: 0.9162, batch_reg_loss: 0.1155, reg_loss: 0.1146 ||:  86%|########5 | 95/111 [01:05<00:10,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8200, UAS: 0.9234, LAS: 0.8636, UEM: 0.4813, LEM: 0.2444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2783, partial_loss/deprel_loss: 1.1654, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3036, loss: 0.9147, batch_reg_loss: 0.1156, reg_loss: 0.1146 ||:  89%|########9 | 99/111 [01:07<00:07,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7740, UAS: 0.9232, LAS: 0.8632, UEM: 0.4859, LEM: 0.2475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9147, partial_loss/deprel_loss: 1.3908, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6113, loss: 0.9170, batch_reg_loss: 0.1157, reg_loss: 0.1146 ||:  93%|#########2| 103/111 [01:10<00:05,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9528, UAS: 0.9242, LAS: 0.8645, UEM: 0.5148, LEM: 0.2843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0692, partial_loss/deprel_loss: 0.2025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2916, loss: 0.9075, batch_reg_loss: 0.1158, reg_loss: 0.1147 ||:  95%|#########5| 106/111 [01:14<00:04,  1.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9248, LAS: 0.8652, UEM: 0.5157, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3227, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5760, loss: 0.9015, batch_reg_loss: 0.1159, reg_loss: 0.1147 ||:  99%|#########9| 110/111 [01:17<00:00,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7932, UAS: 0.9241, LAS: 0.8645, UEM: 0.5140, LEM: 0.2822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8952, partial_loss/deprel_loss: 1.3438, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5700, loss: 0.9075, batch_reg_loss: 0.1159, reg_loss: 0.1147 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
+      "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.344  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.895  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.115  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - UEM                      |     0.514  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - LAS                      |     0.865  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - loss                     |     0.908  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - LEM                      |     0.282  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - UAS                      |     0.924  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - EM                       |     0.793  |       N/A\n",
+      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:29:13,389 - INFO - combo.training.trainer - Epoch duration: 0:01:17.829257\n",
+      "2023-04-06 23:29:13,389 - INFO - combo.training.trainer - Estimated training time remaining: 8:06:21\n",
+      "2023-04-06 23:29:13,389 - INFO - allennlp.training.trainer - Epoch 30/399\n",
+      "2023-04-06 23:29:13,389 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:29:13,390 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:29:13,396 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8497, UAS: 0.9423, LAS: 0.8831, UEM: 0.5266, LEM: 0.2405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8957, partial_loss/deprel_loss: 0.8831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0016, loss: 0.7764, batch_reg_loss: 0.1160, reg_loss: 0.1159 ||:   4%|3         | 4/111 [00:02<01:10,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9297, LAS: 0.8704, UEM: 0.4777, LEM: 0.2176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4410, partial_loss/deprel_loss: 1.0704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2605, loss: 0.8706, batch_reg_loss: 0.1160, reg_loss: 0.1160 ||:   6%|6         | 7/111 [00:04<01:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7884, UAS: 0.9209, LAS: 0.8615, UEM: 0.4229, LEM: 0.1835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9655, partial_loss/deprel_loss: 1.3005, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5497, loss: 0.9493, batch_reg_loss: 0.1161, reg_loss: 0.1160 ||:  10%|9         | 11/111 [00:07<01:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9205, LAS: 0.8604, UEM: 0.4367, LEM: 0.2013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3561, partial_loss/deprel_loss: 0.5195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6030, loss: 0.9509, batch_reg_loss: 0.1162, reg_loss: 0.1160 ||:  13%|#2        | 14/111 [00:09<01:05,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9244, LAS: 0.8644, UEM: 0.4492, LEM: 0.2016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4715, partial_loss/deprel_loss: 0.6246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7102, loss: 0.9135, batch_reg_loss: 0.1162, reg_loss: 0.1161 ||:  15%|#5        | 17/111 [00:11<01:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8499, UAS: 0.9269, LAS: 0.8684, UEM: 0.4862, LEM: 0.2381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1172, partial_loss/deprel_loss: 0.9006, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0602, loss: 0.8846, batch_reg_loss: 0.1163, reg_loss: 0.1161 ||:  18%|#8        | 20/111 [00:13<01:05,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9247, LAS: 0.8656, UEM: 0.4565, LEM: 0.2166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6565, partial_loss/deprel_loss: 0.8579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9340, loss: 0.9051, batch_reg_loss: 0.1164, reg_loss: 0.1161 ||:  22%|##1       | 24/111 [00:16<00:59,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7923, UAS: 0.9189, LAS: 0.8592, UEM: 0.4360, LEM: 0.2045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9101, partial_loss/deprel_loss: 1.2817, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5238, loss: 0.9555, batch_reg_loss: 0.1164, reg_loss: 0.1162 ||:  24%|##4       | 27/111 [00:18<00:57,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8100, UAS: 0.9204, LAS: 0.8606, UEM: 0.4805, LEM: 0.2478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4343, partial_loss/deprel_loss: 1.1992, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3628, loss: 0.9425, batch_reg_loss: 0.1165, reg_loss: 0.1162 ||:  27%|##7       | 30/111 [00:20<00:58,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9195, LAS: 0.8595, UEM: 0.4778, LEM: 0.2454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3692, partial_loss/deprel_loss: 0.5469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6280, loss: 0.9496, batch_reg_loss: 0.1166, reg_loss: 0.1162 ||:  31%|###       | 34/111 [00:23<00:54,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8410, UAS: 0.9186, LAS: 0.8582, UEM: 0.4590, LEM: 0.2313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0912, partial_loss/deprel_loss: 0.9415, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0881, loss: 0.9539, batch_reg_loss: 0.1167, reg_loss: 0.1163 ||:  34%|###4      | 38/111 [00:26<00:49,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9205, LAS: 0.8606, UEM: 0.4768, LEM: 0.2436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2957, partial_loss/deprel_loss: 0.4494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5354, loss: 0.9355, batch_reg_loss: 0.1168, reg_loss: 0.1163 ||:  38%|###7      | 42/111 [00:28<00:47,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7559, UAS: 0.9180, LAS: 0.8576, UEM: 0.4588, LEM: 0.2320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5943, partial_loss/deprel_loss: 1.6157, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9283, loss: 0.9636, batch_reg_loss: 0.1169, reg_loss: 0.1164 ||:  41%|####1     | 46/111 [00:31<00:44,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8097, UAS: 0.9180, LAS: 0.8578, UEM: 0.4674, LEM: 0.2415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4850, partial_loss/deprel_loss: 1.1822, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3597, loss: 0.9619, batch_reg_loss: 0.1169, reg_loss: 0.1164 ||:  44%|####4     | 49/111 [00:33<00:44,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8284, UAS: 0.9181, LAS: 0.8578, UEM: 0.4559, LEM: 0.2312, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1495, partial_loss/deprel_loss: 1.0793, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2104, loss: 0.9637, batch_reg_loss: 0.1170, reg_loss: 0.1165 ||:  48%|####7     | 53/111 [00:36<00:40,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9192, LAS: 0.8589, UEM: 0.4595, LEM: 0.2339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8674, partial_loss/deprel_loss: 1.0027, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0928, loss: 0.9569, batch_reg_loss: 0.1171, reg_loss: 0.1165 ||:  51%|#####1    | 57/111 [00:39<00:36,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9202, LAS: 0.8601, UEM: 0.4839, LEM: 0.2551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1942, partial_loss/deprel_loss: 0.3969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4736, loss: 0.9449, batch_reg_loss: 0.1172, reg_loss: 0.1165 ||:  55%|#####4    | 61/111 [00:41<00:33,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9211, LAS: 0.8613, UEM: 0.4880, LEM: 0.2559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6812, partial_loss/deprel_loss: 0.7970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8911, loss: 0.9362, batch_reg_loss: 0.1173, reg_loss: 0.1166 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9211, LAS: 0.8612, UEM: 0.4893, LEM: 0.2595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9298, partial_loss/deprel_loss: 0.8934, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0180, loss: 0.9348, batch_reg_loss: 0.1173, reg_loss: 0.1166 ||:  60%|######    | 67/111 [00:46<00:31,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9214, LAS: 0.8614, UEM: 0.4829, LEM: 0.2532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5818, partial_loss/deprel_loss: 0.6596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7614, loss: 0.9320, batch_reg_loss: 0.1174, reg_loss: 0.1166 ||:  63%|######3   | 70/111 [00:48<00:28,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8274, UAS: 0.9210, LAS: 0.8611, UEM: 0.4750, LEM: 0.2475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3160, partial_loss/deprel_loss: 1.0731, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2391, loss: 0.9346, batch_reg_loss: 0.1175, reg_loss: 0.1167 ||:  67%|######6   | 74/111 [00:50<00:25,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9217, LAS: 0.8620, UEM: 0.4883, LEM: 0.2643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1238, partial_loss/deprel_loss: 0.2637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3533, loss: 0.9277, batch_reg_loss: 0.1175, reg_loss: 0.1167 ||:  69%|######9   | 77/111 [00:52<00:22,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9227, LAS: 0.8631, UEM: 0.4886, LEM: 0.2645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4876, partial_loss/deprel_loss: 0.5759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.9184, batch_reg_loss: 0.1176, reg_loss: 0.1168 ||:  73%|#######2  | 81/111 [00:55<00:19,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9236, LAS: 0.8643, UEM: 0.4999, LEM: 0.2729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2840, partial_loss/deprel_loss: 0.4352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5226, loss: 0.9100, batch_reg_loss: 0.1177, reg_loss: 0.1168 ||:  77%|#######6  | 85/111 [00:58<00:18,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9248, LAS: 0.8659, UEM: 0.5212, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0727, partial_loss/deprel_loss: 0.1867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2816, loss: 0.8990, batch_reg_loss: 0.1177, reg_loss: 0.1168 ||:  79%|#######9  | 88/111 [01:00<00:16,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9253, LAS: 0.8663, UEM: 0.5287, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3533, partial_loss/deprel_loss: 0.6083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6751, loss: 0.8959, batch_reg_loss: 0.1178, reg_loss: 0.1169 ||:  82%|########1 | 91/111 [01:02<00:14,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9255, LAS: 0.8665, UEM: 0.5249, LEM: 0.2978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5523, partial_loss/deprel_loss: 0.6384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7391, loss: 0.8944, batch_reg_loss: 0.1179, reg_loss: 0.1169 ||:  86%|########5 | 95/111 [01:05<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8749, UAS: 0.9255, LAS: 0.8662, UEM: 0.5190, LEM: 0.2914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5470, partial_loss/deprel_loss: 0.7722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8451, loss: 0.8972, batch_reg_loss: 0.1179, reg_loss: 0.1169 ||:  89%|########9 | 99/111 [01:07<00:07,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9260, LAS: 0.8667, UEM: 0.5188, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5216, partial_loss/deprel_loss: 0.6458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7390, loss: 0.8915, batch_reg_loss: 0.1180, reg_loss: 0.1170 ||:  93%|#########2| 103/111 [01:10<00:05,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9252, LAS: 0.8656, UEM: 0.5142, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5122, partial_loss/deprel_loss: 0.7142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7919, loss: 0.9013, batch_reg_loss: 0.1181, reg_loss: 0.1170 ||:  95%|#########5| 106/111 [01:12<00:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8074, UAS: 0.9252, LAS: 0.8657, UEM: 0.5133, LEM: 0.2834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5927, partial_loss/deprel_loss: 1.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4642, loss: 0.9032, batch_reg_loss: 0.1181, reg_loss: 0.1171 ||:  99%|#########9| 110/111 [01:15<00:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7988, UAS: 0.9247, LAS: 0.8651, UEM: 0.5116, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6141, partial_loss/deprel_loss: 1.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4702, loss: 0.9083, batch_reg_loss: 0.1182, reg_loss: 0.1171 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-06 23:30:29,126 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8614, UAS: 0.9506, LAS: 0.8947, UEM: 0.6800, LEM: 0.3545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0408, partial_loss/deprel_loss: 44.2188, partial_loss/cycle_loss: 0.0000, batch_loss: 35.5832, loss: 24.8075, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.09it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9518, LAS: 0.8976, UEM: 0.6637, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3898, partial_loss/deprel_loss: 17.7429, partial_loss/cycle_loss: 0.0000, batch_loss: 14.2723, loss: 22.5560, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9389, LAS: 0.8836, UEM: 0.6104, LEM: 0.3091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9587, partial_loss/deprel_loss: 37.7004, partial_loss/cycle_loss: 0.0000, batch_loss: 30.3521, loss: 26.7216, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8765, UAS: 0.9361, LAS: 0.8796, UEM: 0.5538, LEM: 0.2631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6483, partial_loss/deprel_loss: 35.0183, partial_loss/cycle_loss: 0.0000, batch_loss: 28.1443, loss: 27.8730, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9399, LAS: 0.8846, UEM: 0.6236, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1799, partial_loss/deprel_loss: 20.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 16.3867, loss: 26.3771, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.06it/s]\n",
+      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.286  |    20.438\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.614  |     0.180\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.117  |     0.000\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - UEM                      |     0.512  |     0.624\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - LAS                      |     0.865  |     0.885\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - loss                     |     0.908  |    26.377\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - LEM                      |     0.282  |     0.353\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - UAS                      |     0.925  |     0.940\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - EM                       |     0.799  |     0.937\n",
+      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:30:41,444 - INFO - combo.training.trainer - Epoch duration: 0:01:28.054718\n",
+      "2023-04-06 23:30:41,444 - INFO - combo.training.trainer - Estimated training time remaining: 8:06:52\n",
+      "2023-04-06 23:30:41,444 - INFO - allennlp.training.trainer - Epoch 31/399\n",
+      "2023-04-06 23:30:41,444 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:30:41,445 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:30:41,452 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8748, UAS: 0.9334, LAS: 0.8786, UEM: 0.4443, LEM: 0.1990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7236, partial_loss/deprel_loss: 0.7101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8310, loss: 0.8045, batch_reg_loss: 0.1182, reg_loss: 0.1182 ||:   4%|3         | 4/111 [00:02<01:04,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8270, UAS: 0.9250, LAS: 0.8677, UEM: 0.5060, LEM: 0.2710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1941, partial_loss/deprel_loss: 1.0869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2266, loss: 0.8819, batch_reg_loss: 0.1183, reg_loss: 0.1182 ||:   6%|6         | 7/111 [00:04<01:04,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9246, LAS: 0.8647, UEM: 0.5259, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3370, partial_loss/deprel_loss: 0.5980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6641, loss: 0.9099, batch_reg_loss: 0.1184, reg_loss: 0.1183 ||:   9%|9         | 10/111 [00:06<01:06,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9163, LAS: 0.8569, UEM: 0.4684, LEM: 0.2328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7216, partial_loss/deprel_loss: 1.2022, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4245, loss: 0.9877, batch_reg_loss: 0.1184, reg_loss: 0.1183 ||:  12%|#1        | 13/111 [00:08<01:05,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9163, LAS: 0.8573, UEM: 0.4320, LEM: 0.2074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4364, partial_loss/deprel_loss: 0.6180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7002, loss: 0.9823, batch_reg_loss: 0.1185, reg_loss: 0.1183 ||:  15%|#5        | 17/111 [00:11<01:00,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9213, LAS: 0.8638, UEM: 0.5339, LEM: 0.3317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0738, partial_loss/deprel_loss: 0.1916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2866, loss: 0.9381, batch_reg_loss: 0.1186, reg_loss: 0.1184 ||:  19%|#8        | 21/111 [00:13<00:59,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7860, UAS: 0.9181, LAS: 0.8604, UEM: 0.5074, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8301, partial_loss/deprel_loss: 1.2250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4647, loss: 0.9604, batch_reg_loss: 0.1187, reg_loss: 0.1184 ||:  22%|##1       | 24/111 [00:16<00:59,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9206, LAS: 0.8625, UEM: 0.5125, LEM: 0.3077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4054, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6872, loss: 0.9412, batch_reg_loss: 0.1188, reg_loss: 0.1185 ||:  25%|##5       | 28/111 [00:18<00:56,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9232, LAS: 0.8654, UEM: 0.5107, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5208, partial_loss/deprel_loss: 0.6426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7371, loss: 0.9181, batch_reg_loss: 0.1189, reg_loss: 0.1185 ||:  29%|##8       | 32/111 [00:21<00:52,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9209, LAS: 0.8630, UEM: 0.5014, LEM: 0.2881, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6350, partial_loss/deprel_loss: 0.7174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8199, loss: 0.9377, batch_reg_loss: 0.1189, reg_loss: 0.1186 ||:  32%|###2      | 36/111 [00:23<00:49,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.9208, LAS: 0.8625, UEM: 0.4858, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7292, partial_loss/deprel_loss: 0.8410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9377, loss: 0.9367, batch_reg_loss: 0.1190, reg_loss: 0.1186 ||:  36%|###6      | 40/111 [00:26<00:45,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8642, UAS: 0.9211, LAS: 0.8619, UEM: 0.4705, LEM: 0.2575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7919, partial_loss/deprel_loss: 0.9952, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0737, loss: 0.9432, batch_reg_loss: 0.1191, reg_loss: 0.1186 ||:  40%|###9      | 44/111 [00:28<00:41,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8376, UAS: 0.9221, LAS: 0.8633, UEM: 0.4997, LEM: 0.2905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0615, partial_loss/deprel_loss: 1.0132, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1421, loss: 0.9287, batch_reg_loss: 0.1192, reg_loss: 0.1187 ||:  43%|####3     | 48/111 [00:31<00:41,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8288, UAS: 0.9231, LAS: 0.8644, UEM: 0.5092, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0852, partial_loss/deprel_loss: 1.0912, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2093, loss: 0.9185, batch_reg_loss: 0.1193, reg_loss: 0.1187 ||:  47%|####6     | 52/111 [00:34<00:41,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7887, UAS: 0.9225, LAS: 0.8640, UEM: 0.5098, LEM: 0.2945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1006, partial_loss/deprel_loss: 1.3113, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5885, loss: 0.9214, batch_reg_loss: 0.1194, reg_loss: 0.1188 ||:  50%|####9     | 55/111 [00:37<00:40,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9226, LAS: 0.8640, UEM: 0.5125, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3773, partial_loss/deprel_loss: 0.6483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7135, loss: 0.9201, batch_reg_loss: 0.1194, reg_loss: 0.1188 ||:  52%|#####2    | 58/111 [00:39<00:39,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8890, UAS: 0.9233, LAS: 0.8648, UEM: 0.5058, LEM: 0.2846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.6365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7419, loss: 0.9154, batch_reg_loss: 0.1195, reg_loss: 0.1188 ||:  56%|#####5    | 62/111 [00:41<00:33,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8473, UAS: 0.9228, LAS: 0.8639, UEM: 0.4991, LEM: 0.2779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0141, partial_loss/deprel_loss: 0.9395, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0740, loss: 0.9225, batch_reg_loss: 0.1196, reg_loss: 0.1189 ||:  59%|#####9    | 66/111 [00:44<00:29,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9241, LAS: 0.8651, UEM: 0.5039, LEM: 0.2764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4332, partial_loss/deprel_loss: 0.6507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7269, loss: 0.9121, batch_reg_loss: 0.1197, reg_loss: 0.1189 ||:  63%|######3   | 70/111 [00:46<00:26,  1.54it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8310, UAS: 0.9232, LAS: 0.8641, UEM: 0.4970, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0867, partial_loss/deprel_loss: 0.9831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1236, loss: 0.9186, batch_reg_loss: 0.1197, reg_loss: 0.1190 ||:  67%|######6   | 74/111 [00:49<00:23,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9234, LAS: 0.8646, UEM: 0.4956, LEM: 0.2692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3508, partial_loss/deprel_loss: 0.4847, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5778, loss: 0.9129, batch_reg_loss: 0.1198, reg_loss: 0.1190 ||:  70%|#######   | 78/111 [00:51<00:21,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8663, UAS: 0.9245, LAS: 0.8657, UEM: 0.4978, LEM: 0.2687, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6454, partial_loss/deprel_loss: 0.8686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9439, loss: 0.9062, batch_reg_loss: 0.1199, reg_loss: 0.1191 ||:  74%|#######3  | 82/111 [00:54<00:18,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9247, LAS: 0.8661, UEM: 0.5063, LEM: 0.2793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8980, partial_loss/deprel_loss: 0.8663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9927, loss: 0.9016, batch_reg_loss: 0.1200, reg_loss: 0.1191 ||:  77%|#######7  | 86/111 [00:57<00:16,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9252, LAS: 0.8666, UEM: 0.5083, LEM: 0.2791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2980, partial_loss/deprel_loss: 0.4854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5679, loss: 0.8977, batch_reg_loss: 0.1200, reg_loss: 0.1191 ||:  80%|########  | 89/111 [00:59<00:14,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8134, UAS: 0.9248, LAS: 0.8661, UEM: 0.5076, LEM: 0.2791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3499, partial_loss/deprel_loss: 1.1000, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2701, loss: 0.9023, batch_reg_loss: 0.1201, reg_loss: 0.1192 ||:  83%|########2 | 92/111 [01:01<00:13,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8550, UAS: 0.9230, LAS: 0.8643, UEM: 0.4989, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0115, partial_loss/deprel_loss: 0.9014, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0436, loss: 0.9173, batch_reg_loss: 0.1202, reg_loss: 0.1192 ||:  86%|########6 | 96/111 [01:04<00:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9233, LAS: 0.8645, UEM: 0.4989, LEM: 0.2735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2969, partial_loss/deprel_loss: 0.4878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5699, loss: 0.9146, batch_reg_loss: 0.1202, reg_loss: 0.1192 ||:  89%|########9 | 99/111 [01:06<00:08,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9238, LAS: 0.8649, UEM: 0.5049, LEM: 0.2769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8979, partial_loss/deprel_loss: 0.9199, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0358, loss: 0.9114, batch_reg_loss: 0.1203, reg_loss: 0.1193 ||:  92%|#########1| 102/111 [01:08<00:06,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8377, UAS: 0.9244, LAS: 0.8655, UEM: 0.5149, LEM: 0.2847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1225, partial_loss/deprel_loss: 1.0132, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1554, loss: 0.9060, batch_reg_loss: 0.1204, reg_loss: 0.1193 ||:  95%|#########4| 105/111 [01:10<00:04,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9240, LAS: 0.8650, UEM: 0.5085, LEM: 0.2798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4996, partial_loss/deprel_loss: 0.6632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7509, loss: 0.9104, batch_reg_loss: 0.1205, reg_loss: 0.1193 ||:  98%|#########8| 109/111 [01:13<00:01,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9245, LAS: 0.8656, UEM: 0.5131, LEM: 0.2829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4847, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7048, loss: 0.9049, batch_reg_loss: 0.1205, reg_loss: 0.1194 ||: 100%|##########| 111/111 [01:14<00:00,  1.48it/s]\n",
+      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.609  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.485  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.119  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - UEM                      |     0.513  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - LAS                      |     0.866  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - loss                     |     0.905  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - LEM                      |     0.283  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - UAS                      |     0.925  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - EM                       |     0.891  |       N/A\n",
+      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:31:56,228 - INFO - combo.training.trainer - Epoch duration: 0:01:14.783878\n",
+      "2023-04-06 23:31:56,228 - INFO - combo.training.trainer - Estimated training time remaining: 8:04:42\n",
+      "2023-04-06 23:31:56,228 - INFO - allennlp.training.trainer - Epoch 32/399\n",
+      "2023-04-06 23:31:56,228 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:31:56,229 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:31:56,236 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.9280, LAS: 0.8652, UEM: 0.3878, LEM: 0.1763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0858, partial_loss/deprel_loss: 1.0690, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1930, loss: 0.9121, batch_reg_loss: 0.1206, reg_loss: 0.1205 ||:   4%|3         | 4/111 [00:02<01:12,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8781, UAS: 0.9222, LAS: 0.8593, UEM: 0.3942, LEM: 0.1663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5145, partial_loss/deprel_loss: 0.7455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8199, loss: 0.9508, batch_reg_loss: 0.1206, reg_loss: 0.1206 ||:   6%|6         | 7/111 [00:04<01:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9268, LAS: 0.8661, UEM: 0.4804, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3036, partial_loss/deprel_loss: 0.5117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5908, loss: 0.8993, batch_reg_loss: 0.1207, reg_loss: 0.1206 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9294, LAS: 0.8701, UEM: 0.4779, LEM: 0.2266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7947, partial_loss/deprel_loss: 0.9712, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0567, loss: 0.8729, batch_reg_loss: 0.1207, reg_loss: 0.1206 ||:  12%|#1        | 13/111 [00:08<01:07,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 0.9245, LAS: 0.8648, UEM: 0.4336, LEM: 0.2022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7990, partial_loss/deprel_loss: 0.7857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9092, loss: 0.9191, batch_reg_loss: 0.1208, reg_loss: 0.1207 ||:  14%|#4        | 16/111 [00:11<01:05,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9516, UAS: 0.9268, LAS: 0.8677, UEM: 0.5322, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0926, partial_loss/deprel_loss: 0.2178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3136, loss: 0.8968, batch_reg_loss: 0.1209, reg_loss: 0.1207 ||:  17%|#7        | 19/111 [00:13<01:05,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8848, UAS: 0.9291, LAS: 0.8698, UEM: 0.5301, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5335, partial_loss/deprel_loss: 0.6623, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 0.8739, batch_reg_loss: 0.1209, reg_loss: 0.1207 ||:  20%|#9        | 22/111 [00:15<01:06,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8973, UAS: 0.9269, LAS: 0.8675, UEM: 0.5307, LEM: 0.3049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3634, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6176, loss: 0.8880, batch_reg_loss: 0.1210, reg_loss: 0.1207 ||:  23%|##2       | 25/111 [00:18<01:04,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9255, LAS: 0.8662, UEM: 0.5171, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1714, partial_loss/deprel_loss: 1.0061, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1602, loss: 0.9002, batch_reg_loss: 0.1210, reg_loss: 0.1208 ||:  25%|##5       | 28/111 [00:20<01:03,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9248, LAS: 0.8655, UEM: 0.5165, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2944, partial_loss/deprel_loss: 0.4554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5443, loss: 0.9082, batch_reg_loss: 0.1211, reg_loss: 0.1208 ||:  28%|##7       | 31/111 [00:22<01:01,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9272, LAS: 0.8687, UEM: 0.5406, LEM: 0.3166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1706, partial_loss/deprel_loss: 0.3330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4217, loss: 0.8810, batch_reg_loss: 0.1211, reg_loss: 0.1208 ||:  31%|###       | 34/111 [00:25<00:59,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9299, LAS: 0.8714, UEM: 0.5655, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1528, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4713, loss: 0.8544, batch_reg_loss: 0.1212, reg_loss: 0.1209 ||:  34%|###4      | 38/111 [00:27<00:54,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7832, UAS: 0.9285, LAS: 0.8704, UEM: 0.5675, LEM: 0.3304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1536, partial_loss/deprel_loss: 1.2558, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5566, loss: 0.8616, batch_reg_loss: 0.1213, reg_loss: 0.1209 ||:  37%|###6      | 41/111 [00:30<00:53,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9300, LAS: 0.8721, UEM: 0.5725, LEM: 0.3317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3764, partial_loss/deprel_loss: 0.4992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.8479, batch_reg_loss: 0.1213, reg_loss: 0.1209 ||:  40%|###9      | 44/111 [00:32<00:50,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9297, LAS: 0.8715, UEM: 0.5590, LEM: 0.3199, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3903, partial_loss/deprel_loss: 0.6036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6823, loss: 0.8563, batch_reg_loss: 0.1214, reg_loss: 0.1210 ||:  43%|####3     | 48/111 [00:35<00:46,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9309, LAS: 0.8732, UEM: 0.5558, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4737, partial_loss/deprel_loss: 0.6535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7390, loss: 0.8460, batch_reg_loss: 0.1215, reg_loss: 0.1210 ||:  47%|####6     | 52/111 [00:37<00:41,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8597, UAS: 0.9302, LAS: 0.8723, UEM: 0.5439, LEM: 0.3032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6993, partial_loss/deprel_loss: 0.7695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8770, loss: 0.8525, batch_reg_loss: 0.1215, reg_loss: 0.1210 ||:  50%|#####     | 56/111 [00:40<00:37,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8500, UAS: 0.9306, LAS: 0.8729, UEM: 0.5460, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0724, partial_loss/deprel_loss: 1.0548, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1799, loss: 0.8494, batch_reg_loss: 0.1216, reg_loss: 0.1211 ||:  53%|#####3    | 59/111 [00:42<00:37,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8331, UAS: 0.9290, LAS: 0.8712, UEM: 0.5358, LEM: 0.2987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2836, partial_loss/deprel_loss: 0.9883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1690, loss: 0.8636, batch_reg_loss: 0.1216, reg_loss: 0.1211 ||:  56%|#####5    | 62/111 [00:44<00:34,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9293, LAS: 0.8715, UEM: 0.5296, LEM: 0.2908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6870, partial_loss/deprel_loss: 0.7730, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8775, loss: 0.8617, batch_reg_loss: 0.1217, reg_loss: 0.1211 ||:  59%|#####9    | 66/111 [00:47<00:30,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8233, UAS: 0.9263, LAS: 0.8683, UEM: 0.5209, LEM: 0.2855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4318, partial_loss/deprel_loss: 1.0938, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2831, loss: 0.8883, batch_reg_loss: 0.1218, reg_loss: 0.1211 ||:  62%|######2   | 69/111 [00:49<00:28,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9263, LAS: 0.8683, UEM: 0.5139, LEM: 0.2789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7876, partial_loss/deprel_loss: 0.7696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8951, loss: 0.8890, batch_reg_loss: 0.1218, reg_loss: 0.1212 ||:  66%|######5   | 73/111 [00:51<00:24,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8262, UAS: 0.9260, LAS: 0.8681, UEM: 0.5085, LEM: 0.2743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1389, partial_loss/deprel_loss: 1.0152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1619, loss: 0.8884, batch_reg_loss: 0.1219, reg_loss: 0.1212 ||:  69%|######9   | 77/111 [00:54<00:22,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9255, LAS: 0.8675, UEM: 0.5156, LEM: 0.2866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.2815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3720, loss: 0.8924, batch_reg_loss: 0.1220, reg_loss: 0.1213 ||:  73%|#######2  | 81/111 [00:57<00:19,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9251, LAS: 0.8669, UEM: 0.5146, LEM: 0.2873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3275, partial_loss/deprel_loss: 0.4241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5269, loss: 0.8963, batch_reg_loss: 0.1221, reg_loss: 0.1213 ||:  77%|#######6  | 85/111 [00:59<00:17,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9257, LAS: 0.8675, UEM: 0.5170, LEM: 0.2874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8591, partial_loss/deprel_loss: 0.9767, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0754, loss: 0.8924, batch_reg_loss: 0.1222, reg_loss: 0.1213 ||:  79%|#######9  | 88/111 [01:02<00:16,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9258, LAS: 0.8675, UEM: 0.5237, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1875, partial_loss/deprel_loss: 0.3560, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4446, loss: 0.8923, batch_reg_loss: 0.1222, reg_loss: 0.1214 ||:  82%|########1 | 91/111 [01:04<00:14,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9017, UAS: 0.9254, LAS: 0.8670, UEM: 0.5240, LEM: 0.2931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3555, partial_loss/deprel_loss: 0.5276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6155, loss: 0.8989, batch_reg_loss: 0.1223, reg_loss: 0.1214 ||:  86%|########5 | 95/111 [01:07<00:11,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.9248, LAS: 0.8662, UEM: 0.5177, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9644, partial_loss/deprel_loss: 0.8869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0248, loss: 0.9030, batch_reg_loss: 0.1224, reg_loss: 0.1214 ||:  88%|########8 | 98/111 [01:09<00:09,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9248, LAS: 0.8662, UEM: 0.5197, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6818, partial_loss/deprel_loss: 0.8229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9171, loss: 0.9023, batch_reg_loss: 0.1225, reg_loss: 0.1215 ||:  92%|#########1| 102/111 [01:11<00:06,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8629, UAS: 0.9248, LAS: 0.8661, UEM: 0.5155, LEM: 0.2858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8211, partial_loss/deprel_loss: 0.8211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9436, loss: 0.9038, batch_reg_loss: 0.1226, reg_loss: 0.1215 ||:  95%|#########5| 106/111 [01:14<00:03,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8603, UAS: 0.9251, LAS: 0.8664, UEM: 0.5153, LEM: 0.2849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7650, partial_loss/deprel_loss: 0.8273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9375, loss: 0.9013, batch_reg_loss: 0.1226, reg_loss: 0.1215 ||:  99%|#########9| 110/111 [01:16<00:00,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8006, UAS: 0.9245, LAS: 0.8658, UEM: 0.5134, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5343, partial_loss/deprel_loss: 1.2796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4532, loss: 0.9062, batch_reg_loss: 0.1227, reg_loss: 0.1215 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
+      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.280  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.534  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.122  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - UEM                      |     0.513  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - LAS                      |     0.866  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - loss                     |     0.906  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - LEM                      |     0.284  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - UAS                      |     0.925  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - EM                       |     0.801  |       N/A\n",
+      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:33:13,715 - INFO - combo.training.trainer - Epoch duration: 0:01:17.486642\n",
+      "2023-04-06 23:33:13,715 - INFO - combo.training.trainer - Estimated training time remaining: 8:03:06\n",
+      "2023-04-06 23:33:13,715 - INFO - allennlp.training.trainer - Epoch 33/399\n",
+      "2023-04-06 23:33:13,715 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:33:13,716 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:33:13,722 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8321, UAS: 0.9211, LAS: 0.8634, UEM: 0.2448, LEM: 0.0606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2054, partial_loss/deprel_loss: 0.9809, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1485, loss: 0.9179, batch_reg_loss: 0.1227, reg_loss: 0.1227 ||:   4%|3         | 4/111 [00:02<01:16,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9216, LAS: 0.8649, UEM: 0.4007, LEM: 0.2139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8307, partial_loss/deprel_loss: 0.7976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9270, loss: 0.9128, batch_reg_loss: 0.1228, reg_loss: 0.1227 ||:   6%|6         | 7/111 [00:05<01:17,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9301, LAS: 0.8748, UEM: 0.4858, LEM: 0.2617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5363, partial_loss/deprel_loss: 0.5515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6713, loss: 0.8323, batch_reg_loss: 0.1229, reg_loss: 0.1228 ||:   9%|9         | 10/111 [00:07<01:16,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9291, LAS: 0.8730, UEM: 0.4607, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6542, partial_loss/deprel_loss: 0.7278, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8360, loss: 0.8399, batch_reg_loss: 0.1229, reg_loss: 0.1228 ||:  13%|#2        | 14/111 [00:10<01:09,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9238, LAS: 0.8661, UEM: 0.4238, LEM: 0.2058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1477, partial_loss/deprel_loss: 1.0175, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1666, loss: 0.9019, batch_reg_loss: 0.1230, reg_loss: 0.1228 ||:  15%|#5        | 17/111 [00:12<01:06,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9265, LAS: 0.8681, UEM: 0.4492, LEM: 0.2182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2747, partial_loss/deprel_loss: 0.4835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5648, loss: 0.8846, batch_reg_loss: 0.1231, reg_loss: 0.1229 ||:  18%|#8        | 20/111 [00:14<01:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7840, UAS: 0.9254, LAS: 0.8666, UEM: 0.4648, LEM: 0.2258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8170, partial_loss/deprel_loss: 1.3568, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5720, loss: 0.8961, batch_reg_loss: 0.1231, reg_loss: 0.1229 ||:  21%|##        | 23/111 [00:16<01:02,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.9235, LAS: 0.8644, UEM: 0.4432, LEM: 0.2090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1372, partial_loss/deprel_loss: 0.9852, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1388, loss: 0.9177, batch_reg_loss: 0.1232, reg_loss: 0.1229 ||:  24%|##4       | 27/111 [00:18<00:57,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9265, LAS: 0.8682, UEM: 0.4929, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.4143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.8827, batch_reg_loss: 0.1232, reg_loss: 0.1230 ||:  27%|##7       | 30/111 [00:21<00:56,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9256, LAS: 0.8672, UEM: 0.4734, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9719, partial_loss/deprel_loss: 0.9334, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0644, loss: 0.8918, batch_reg_loss: 0.1233, reg_loss: 0.1230 ||:  30%|##9       | 33/111 [00:23<00:53,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8678, UAS: 0.9268, LAS: 0.8684, UEM: 0.4827, LEM: 0.2445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6742, partial_loss/deprel_loss: 0.7842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8856, loss: 0.8809, batch_reg_loss: 0.1234, reg_loss: 0.1230 ||:  32%|###2      | 36/111 [00:25<00:52,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9268, LAS: 0.8687, UEM: 0.4928, LEM: 0.2582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1770, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4536, loss: 0.8786, batch_reg_loss: 0.1235, reg_loss: 0.1231 ||:  36%|###6      | 40/111 [00:27<00:47,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7844, UAS: 0.9267, LAS: 0.8682, UEM: 0.4953, LEM: 0.2548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8813, partial_loss/deprel_loss: 1.3088, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5469, loss: 0.8836, batch_reg_loss: 0.1235, reg_loss: 0.1231 ||:  40%|###9      | 44/111 [00:30<00:44,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8473, UAS: 0.9241, LAS: 0.8655, UEM: 0.4929, LEM: 0.2566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8672, partial_loss/deprel_loss: 0.9594, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0645, loss: 0.9084, batch_reg_loss: 0.1236, reg_loss: 0.1231 ||:  43%|####3     | 48/111 [00:33<00:42,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9233, LAS: 0.8647, UEM: 0.4857, LEM: 0.2512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4534, partial_loss/deprel_loss: 0.5398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6462, loss: 0.9137, batch_reg_loss: 0.1237, reg_loss: 0.1232 ||:  47%|####6     | 52/111 [00:35<00:39,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9234, LAS: 0.8646, UEM: 0.4809, LEM: 0.2454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4625, partial_loss/deprel_loss: 0.5691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6716, loss: 0.9135, batch_reg_loss: 0.1238, reg_loss: 0.1232 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9234, LAS: 0.8646, UEM: 0.5000, LEM: 0.2691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1320, partial_loss/deprel_loss: 0.2790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3734, loss: 0.9154, batch_reg_loss: 0.1239, reg_loss: 0.1233 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9247, LAS: 0.8660, UEM: 0.5193, LEM: 0.2878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2943, partial_loss/deprel_loss: 0.4989, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5819, loss: 0.9023, batch_reg_loss: 0.1239, reg_loss: 0.1233 ||:  57%|#####6    | 63/111 [00:44<00:37,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9245, LAS: 0.8655, UEM: 0.5094, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8338, partial_loss/deprel_loss: 0.9125, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0207, loss: 0.9076, batch_reg_loss: 0.1240, reg_loss: 0.1233 ||:  60%|######    | 67/111 [00:47<00:32,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9238, LAS: 0.8647, UEM: 0.5004, LEM: 0.2726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0190, partial_loss/deprel_loss: 0.8973, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0457, loss: 0.9132, batch_reg_loss: 0.1241, reg_loss: 0.1234 ||:  63%|######3   | 70/111 [00:49<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8830, UAS: 0.9256, LAS: 0.8670, UEM: 0.5380, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5388, partial_loss/deprel_loss: 0.6799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7758, loss: 0.8967, batch_reg_loss: 0.1241, reg_loss: 0.1234 ||:  66%|######5   | 73/111 [00:51<00:28,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9259, LAS: 0.8673, UEM: 0.5356, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4678, partial_loss/deprel_loss: 0.5111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6266, loss: 0.8944, batch_reg_loss: 0.1242, reg_loss: 0.1234 ||:  68%|######8   | 76/111 [00:53<00:26,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9264, LAS: 0.8678, UEM: 0.5363, LEM: 0.3104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5585, partial_loss/deprel_loss: 0.7297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8197, loss: 0.8902, batch_reg_loss: 0.1242, reg_loss: 0.1235 ||:  71%|#######1  | 79/111 [00:56<00:24,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7776, UAS: 0.9260, LAS: 0.8674, UEM: 0.5386, LEM: 0.3097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2130, partial_loss/deprel_loss: 1.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6674, loss: 0.8933, batch_reg_loss: 0.1243, reg_loss: 0.1235 ||:  74%|#######3  | 82/111 [00:58<00:22,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8544, UAS: 0.9256, LAS: 0.8668, UEM: 0.5348, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7456, partial_loss/deprel_loss: 0.7852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9016, loss: 0.8981, batch_reg_loss: 0.1244, reg_loss: 0.1235 ||:  77%|#######6  | 85/111 [01:00<00:19,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9255, LAS: 0.8665, UEM: 0.5300, LEM: 0.3019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5330, partial_loss/deprel_loss: 0.6727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7692, loss: 0.8982, batch_reg_loss: 0.1244, reg_loss: 0.1236 ||:  80%|########  | 89/111 [01:03<00:15,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9262, LAS: 0.8673, UEM: 0.5294, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4852, partial_loss/deprel_loss: 0.6245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7211, loss: 0.8921, batch_reg_loss: 0.1245, reg_loss: 0.1236 ||:  83%|########2 | 92/111 [01:05<00:13,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9261, LAS: 0.8670, UEM: 0.5272, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3968, partial_loss/deprel_loss: 0.5528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6462, loss: 0.8936, batch_reg_loss: 0.1246, reg_loss: 0.1236 ||:  86%|########6 | 96/111 [01:08<00:10,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8171, UAS: 0.9254, LAS: 0.8662, UEM: 0.5244, LEM: 0.2939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5442, partial_loss/deprel_loss: 0.9765, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2147, loss: 0.8996, batch_reg_loss: 0.1246, reg_loss: 0.1237 ||:  89%|########9 | 99/111 [01:10<00:08,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8560, UAS: 0.9260, LAS: 0.8668, UEM: 0.5231, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7287, partial_loss/deprel_loss: 0.8699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9663, loss: 0.8954, batch_reg_loss: 0.1247, reg_loss: 0.1237 ||:  93%|#########2| 103/111 [01:12<00:05,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9264, LAS: 0.8673, UEM: 0.5263, LEM: 0.2927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4031, partial_loss/deprel_loss: 0.6182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6999, loss: 0.8923, batch_reg_loss: 0.1248, reg_loss: 0.1237 ||:  95%|#########5| 106/111 [01:14<00:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8152, UAS: 0.9260, LAS: 0.8666, UEM: 0.5221, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2286, partial_loss/deprel_loss: 1.1836, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3174, loss: 0.8969, batch_reg_loss: 0.1249, reg_loss: 0.1238 ||:  99%|#########9| 110/111 [01:17<00:00,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9261, LAS: 0.8668, UEM: 0.5215, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5971, partial_loss/deprel_loss: 0.7101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8123, loss: 0.8961, batch_reg_loss: 0.1249, reg_loss: 0.1238 ||: 100%|##########| 111/111 [01:17<00:00,  1.42it/s]\n",
+      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.710  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.597  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.124  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - UEM                      |     0.522  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - LAS                      |     0.867  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - loss                     |     0.896  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - LEM                      |     0.289  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - UAS                      |     0.926  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - EM                       |     0.884  |       N/A\n",
+      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:34:31,639 - INFO - combo.training.trainer - Epoch duration: 0:01:17.923745\n",
+      "2023-04-06 23:34:31,639 - INFO - combo.training.trainer - Estimated training time remaining: 8:01:36\n",
+      "2023-04-06 23:34:31,639 - INFO - allennlp.training.trainer - Epoch 34/399\n",
+      "2023-04-06 23:34:31,639 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:34:31,640 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:34:31,646 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8560, UAS: 0.9111, LAS: 0.8494, UEM: 0.1556, LEM: 0.0333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7581, partial_loss/deprel_loss: 0.8816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9818, loss: 1.0546, batch_reg_loss: 0.1249, reg_loss: 0.1249 ||:   3%|2         | 3/111 [00:02<01:13,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9056, LAS: 0.8439, UEM: 0.2538, LEM: 0.0790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4955, partial_loss/deprel_loss: 0.6868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7736, loss: 1.0748, batch_reg_loss: 0.1250, reg_loss: 0.1249 ||:   5%|5         | 6/111 [00:04<01:12,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7825, UAS: 0.9077, LAS: 0.8464, UEM: 0.3817, LEM: 0.1861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7655, partial_loss/deprel_loss: 1.2883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5088, loss: 1.0438, batch_reg_loss: 0.1251, reg_loss: 0.1250 ||:   8%|8         | 9/111 [00:06<01:09,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9136, LAS: 0.8528, UEM: 0.3986, LEM: 0.1842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6326, partial_loss/deprel_loss: 0.7305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8360, loss: 1.0011, batch_reg_loss: 0.1251, reg_loss: 0.1250 ||:  11%|#         | 12/111 [00:08<01:09,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8578, UAS: 0.9196, LAS: 0.8600, UEM: 0.4359, LEM: 0.1994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0891, partial_loss/deprel_loss: 0.8639, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0341, loss: 0.9523, batch_reg_loss: 0.1252, reg_loss: 0.1250 ||:  14%|#4        | 16/111 [00:10<01:04,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9183, LAS: 0.8599, UEM: 0.4232, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4165, partial_loss/deprel_loss: 1.0787, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2716, loss: 0.9521, batch_reg_loss: 0.1253, reg_loss: 0.1251 ||:  18%|#8        | 20/111 [00:13<01:00,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9221, LAS: 0.8642, UEM: 0.4556, LEM: 0.2267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4718, partial_loss/deprel_loss: 0.5684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6744, loss: 0.9203, batch_reg_loss: 0.1253, reg_loss: 0.1251 ||:  21%|##        | 23/111 [00:15<01:01,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8940, UAS: 0.9262, LAS: 0.8687, UEM: 0.4854, LEM: 0.2382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4130, partial_loss/deprel_loss: 0.5913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6810, loss: 0.8882, batch_reg_loss: 0.1254, reg_loss: 0.1251 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9281, LAS: 0.8704, UEM: 0.4951, LEM: 0.2408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3141, partial_loss/deprel_loss: 0.4727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5664, loss: 0.8715, batch_reg_loss: 0.1255, reg_loss: 0.1252 ||:  26%|##6       | 29/111 [00:20<00:59,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8954, UAS: 0.9292, LAS: 0.8718, UEM: 0.5290, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3000, partial_loss/deprel_loss: 0.4808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5701, loss: 0.8581, batch_reg_loss: 0.1255, reg_loss: 0.1252 ||:  29%|##8       | 32/111 [00:22<00:59,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9294, LAS: 0.8719, UEM: 0.5231, LEM: 0.2740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3971, partial_loss/deprel_loss: 0.5997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6847, loss: 0.8609, batch_reg_loss: 0.1256, reg_loss: 0.1252 ||:  32%|###2      | 36/111 [00:25<00:53,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8502, UAS: 0.9275, LAS: 0.8696, UEM: 0.5066, LEM: 0.2621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9660, partial_loss/deprel_loss: 0.8184, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9736, loss: 0.8780, batch_reg_loss: 0.1256, reg_loss: 0.1253 ||:  36%|###6      | 40/111 [00:27<00:48,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9269, LAS: 0.8686, UEM: 0.4966, LEM: 0.2515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4479, partial_loss/deprel_loss: 0.6066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7006, loss: 0.8859, batch_reg_loss: 0.1257, reg_loss: 0.1253 ||:  40%|###9      | 44/111 [00:30<00:45,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9260, LAS: 0.8677, UEM: 0.4901, LEM: 0.2465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5388, partial_loss/deprel_loss: 0.5948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7094, loss: 0.8959, batch_reg_loss: 0.1258, reg_loss: 0.1253 ||:  42%|####2     | 47/111 [00:32<00:44,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9266, LAS: 0.8686, UEM: 0.4965, LEM: 0.2503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2710, partial_loss/deprel_loss: 0.4662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5530, loss: 0.8885, batch_reg_loss: 0.1259, reg_loss: 0.1254 ||:  46%|####5     | 51/111 [00:35<00:40,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9264, LAS: 0.8687, UEM: 0.5060, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0437, partial_loss/deprel_loss: 0.9126, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0648, loss: 0.8867, batch_reg_loss: 0.1259, reg_loss: 0.1254 ||:  49%|####8     | 54/111 [00:37<00:39,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9265, LAS: 0.8685, UEM: 0.4986, LEM: 0.2585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4914, partial_loss/deprel_loss: 0.6521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7459, loss: 0.8885, batch_reg_loss: 0.1260, reg_loss: 0.1254 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9267, LAS: 0.8690, UEM: 0.5166, LEM: 0.2750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3150, partial_loss/deprel_loss: 0.4455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.8846, batch_reg_loss: 0.1261, reg_loss: 0.1255 ||:  54%|#####4    | 60/111 [00:41<00:36,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9268, LAS: 0.8693, UEM: 0.5151, LEM: 0.2750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4608, partial_loss/deprel_loss: 0.5828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6845, loss: 0.8828, batch_reg_loss: 0.1261, reg_loss: 0.1255 ||:  57%|#####6    | 63/111 [00:44<00:35,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8797, UAS: 0.9262, LAS: 0.8687, UEM: 0.5069, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5799, partial_loss/deprel_loss: 0.7299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8261, loss: 0.8887, batch_reg_loss: 0.1262, reg_loss: 0.1255 ||:  59%|#####9    | 66/111 [00:46<00:32,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8858, UAS: 0.9267, LAS: 0.8691, UEM: 0.5082, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5195, partial_loss/deprel_loss: 0.6044, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7137, loss: 0.8859, batch_reg_loss: 0.1262, reg_loss: 0.1256 ||:  62%|######2   | 69/111 [00:48<00:31,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7946, UAS: 0.9255, LAS: 0.8676, UEM: 0.4995, LEM: 0.2632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6270, partial_loss/deprel_loss: 1.1887, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4026, loss: 0.8979, batch_reg_loss: 0.1263, reg_loss: 0.1256 ||:  65%|######4   | 72/111 [00:50<00:29,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9261, LAS: 0.8686, UEM: 0.5204, LEM: 0.2931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7267, partial_loss/deprel_loss: 0.8069, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9172, loss: 0.8909, batch_reg_loss: 0.1264, reg_loss: 0.1256 ||:  68%|######7   | 75/111 [00:53<00:27,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8154, UAS: 0.9257, LAS: 0.8678, UEM: 0.5206, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2415, partial_loss/deprel_loss: 1.1330, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2811, loss: 0.8966, batch_reg_loss: 0.1264, reg_loss: 0.1257 ||:  71%|#######1  | 79/111 [00:55<00:23,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9256, LAS: 0.8678, UEM: 0.5151, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6984, partial_loss/deprel_loss: 0.7058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8308, loss: 0.8966, batch_reg_loss: 0.1265, reg_loss: 0.1257 ||:  74%|#######3  | 82/111 [00:58<00:21,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8430, UAS: 0.9253, LAS: 0.8674, UEM: 0.5110, LEM: 0.2866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1613, partial_loss/deprel_loss: 0.9831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1453, loss: 0.9004, batch_reg_loss: 0.1266, reg_loss: 0.1257 ||:  77%|#######6  | 85/111 [01:00<00:18,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9256, LAS: 0.8676, UEM: 0.5044, LEM: 0.2798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7210, partial_loss/deprel_loss: 0.8211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9277, loss: 0.8993, batch_reg_loss: 0.1266, reg_loss: 0.1258 ||:  80%|########  | 89/111 [01:02<00:14,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9267, LAS: 0.8690, UEM: 0.5185, LEM: 0.2945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1218, partial_loss/deprel_loss: 0.2729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3694, loss: 0.8883, batch_reg_loss: 0.1267, reg_loss: 0.1258 ||:  84%|########3 | 93/111 [01:05<00:12,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9271, LAS: 0.8695, UEM: 0.5184, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8011, partial_loss/deprel_loss: 0.7246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8667, loss: 0.8846, batch_reg_loss: 0.1268, reg_loss: 0.1258 ||:  87%|########7 | 97/111 [01:07<00:09,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8105, UAS: 0.9253, LAS: 0.8672, UEM: 0.5146, LEM: 0.2885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3796, partial_loss/deprel_loss: 1.2244, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3823, loss: 0.9042, batch_reg_loss: 0.1269, reg_loss: 0.1259 ||:  91%|######### | 101/111 [01:10<00:06,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9253, LAS: 0.8672, UEM: 0.5136, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4786, partial_loss/deprel_loss: 0.7123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7925, loss: 0.9034, batch_reg_loss: 0.1270, reg_loss: 0.1259 ||:  95%|#########4| 105/111 [01:12<00:03,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9259, LAS: 0.8680, UEM: 0.5158, LEM: 0.2860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3995, partial_loss/deprel_loss: 0.4815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5921, loss: 0.8959, batch_reg_loss: 0.1270, reg_loss: 0.1260 ||:  98%|#########8| 109/111 [01:15<00:01,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9261, LAS: 0.8681, UEM: 0.5174, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8394, partial_loss/deprel_loss: 0.8557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9796, loss: 0.8944, batch_reg_loss: 0.1271, reg_loss: 0.1260 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-06 23:35:48,409 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:35:48,409 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.856  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.839  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.126  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - UEM                      |     0.517  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - LAS                      |     0.868  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - loss                     |     0.894  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - LEM                      |     0.286  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - UAS                      |     0.926  |       N/A\n",
+      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:35:48,411 - INFO - combo.training.tensorboard_writer - EM                       |     0.853  |       N/A\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-06 23:35:48,411 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:35:48,411 - INFO - combo.training.trainer - Epoch duration: 0:01:16.772068\n",
+      "2023-04-06 23:35:48,411 - INFO - combo.training.trainer - Estimated training time remaining: 7:59:54\n",
+      "2023-04-06 23:35:48,411 - INFO - allennlp.training.trainer - Epoch 35/399\n",
+      "2023-04-06 23:35:48,411 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:35:48,412 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:35:48,418 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8295, UAS: 0.9216, LAS: 0.8633, UEM: 0.5277, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1609, partial_loss/deprel_loss: 0.9063, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0844, loss: 0.8635, batch_reg_loss: 0.1272, reg_loss: 0.1271 ||:   4%|3         | 4/111 [00:02<01:10,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9235, LAS: 0.8655, UEM: 0.4402, LEM: 0.2191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5437, partial_loss/deprel_loss: 0.6562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7609, loss: 0.8720, batch_reg_loss: 0.1272, reg_loss: 0.1272 ||:   6%|6         | 7/111 [00:04<01:09,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9283, LAS: 0.8721, UEM: 0.5337, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2537, partial_loss/deprel_loss: 0.4130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5084, loss: 0.8287, batch_reg_loss: 0.1273, reg_loss: 0.1272 ||:  10%|9         | 11/111 [00:07<01:04,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9337, LAS: 0.8795, UEM: 0.6324, LEM: 0.4287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8339, partial_loss/deprel_loss: 0.8628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9844, loss: 0.7854, batch_reg_loss: 0.1274, reg_loss: 0.1272 ||:  13%|#2        | 14/111 [00:09<01:05,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9359, LAS: 0.8817, UEM: 0.6234, LEM: 0.4027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4166, partial_loss/deprel_loss: 0.6455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7271, loss: 0.7716, batch_reg_loss: 0.1274, reg_loss: 0.1273 ||:  15%|#5        | 17/111 [00:11<01:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9321, LAS: 0.8770, UEM: 0.5887, LEM: 0.3752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9956, partial_loss/deprel_loss: 0.8582, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0131, loss: 0.8049, batch_reg_loss: 0.1275, reg_loss: 0.1273 ||:  18%|#8        | 20/111 [00:13<01:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9340, LAS: 0.8787, UEM: 0.5950, LEM: 0.3729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3717, partial_loss/deprel_loss: 0.6203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6981, loss: 0.7990, batch_reg_loss: 0.1275, reg_loss: 0.1273 ||:  21%|##        | 23/111 [00:15<01:01,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.9337, LAS: 0.8779, UEM: 0.5850, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2579, partial_loss/deprel_loss: 0.9992, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1785, loss: 0.8028, batch_reg_loss: 0.1276, reg_loss: 0.1273 ||:  24%|##4       | 27/111 [00:17<00:55,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9350, LAS: 0.8794, UEM: 0.5883, LEM: 0.3559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2687, partial_loss/deprel_loss: 0.4893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.7937, batch_reg_loss: 0.1276, reg_loss: 0.1274 ||:  27%|##7       | 30/111 [00:20<00:55,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9357, LAS: 0.8800, UEM: 0.5762, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6725, partial_loss/deprel_loss: 0.7140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8334, loss: 0.7902, batch_reg_loss: 0.1277, reg_loss: 0.1274 ||:  31%|###       | 34/111 [00:22<00:51,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8797, UAS: 0.9370, LAS: 0.8816, UEM: 0.5877, LEM: 0.3504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5669, partial_loss/deprel_loss: 0.7290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8244, loss: 0.7811, batch_reg_loss: 0.1278, reg_loss: 0.1274 ||:  33%|###3      | 37/111 [00:24<00:50,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9350, LAS: 0.8792, UEM: 0.5682, LEM: 0.3341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2426, partial_loss/deprel_loss: 1.1232, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2749, loss: 0.8012, batch_reg_loss: 0.1278, reg_loss: 0.1275 ||:  37%|###6      | 41/111 [00:27<00:47,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7827, UAS: 0.9333, LAS: 0.8773, UEM: 0.5601, LEM: 0.3259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1731, partial_loss/deprel_loss: 1.4011, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6834, loss: 0.8193, batch_reg_loss: 0.1279, reg_loss: 0.1275 ||:  41%|####      | 45/111 [00:30<00:44,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8356, UAS: 0.9327, LAS: 0.8767, UEM: 0.5487, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2953, partial_loss/deprel_loss: 0.9857, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1755, loss: 0.8261, batch_reg_loss: 0.1280, reg_loss: 0.1275 ||:  44%|####4     | 49/111 [00:32<00:41,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9332, LAS: 0.8771, UEM: 0.5407, LEM: 0.3053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6257, partial_loss/deprel_loss: 0.8141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9044, loss: 0.8255, batch_reg_loss: 0.1280, reg_loss: 0.1276 ||:  48%|####7     | 53/111 [00:35<00:37,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9305, LAS: 0.8738, UEM: 0.5267, LEM: 0.2957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7496, partial_loss/deprel_loss: 0.8220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9356, loss: 0.8506, batch_reg_loss: 0.1281, reg_loss: 0.1276 ||:  51%|#####1    | 57/111 [00:37<00:34,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9294, LAS: 0.8723, UEM: 0.5206, LEM: 0.2915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.6737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7804, loss: 0.8612, batch_reg_loss: 0.1282, reg_loss: 0.1276 ||:  55%|#####4    | 61/111 [00:40<00:32,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9286, LAS: 0.8712, UEM: 0.5098, LEM: 0.2818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6110, partial_loss/deprel_loss: 0.7682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8651, loss: 0.8717, batch_reg_loss: 0.1283, reg_loss: 0.1277 ||:  59%|#####8    | 65/111 [00:43<00:30,  1.53it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9255, LAS: 0.8680, UEM: 0.4994, LEM: 0.2757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8341, partial_loss/deprel_loss: 0.8179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9495, loss: 0.8981, batch_reg_loss: 0.1284, reg_loss: 0.1277 ||:  62%|######2   | 69/111 [00:45<00:28,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8583, UAS: 0.9260, LAS: 0.8685, UEM: 0.5123, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7949, partial_loss/deprel_loss: 0.7780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9098, loss: 0.8941, batch_reg_loss: 0.1284, reg_loss: 0.1278 ||:  65%|######4   | 72/111 [00:47<00:26,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7804, UAS: 0.9254, LAS: 0.8680, UEM: 0.5102, LEM: 0.2885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1089, partial_loss/deprel_loss: 1.2912, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5832, loss: 0.8992, batch_reg_loss: 0.1285, reg_loss: 0.1278 ||:  68%|######7   | 75/111 [00:50<00:24,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9269, LAS: 0.8696, UEM: 0.5202, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2120, partial_loss/deprel_loss: 0.3991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4903, loss: 0.8862, batch_reg_loss: 0.1286, reg_loss: 0.1278 ||:  71%|#######1  | 79/111 [00:52<00:22,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9274, LAS: 0.8700, UEM: 0.5204, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3154, partial_loss/deprel_loss: 0.4886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5826, loss: 0.8838, batch_reg_loss: 0.1287, reg_loss: 0.1279 ||:  74%|#######3  | 82/111 [00:55<00:20,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9041, UAS: 0.9281, LAS: 0.8709, UEM: 0.5253, LEM: 0.2929, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3072, partial_loss/deprel_loss: 0.4757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5707, loss: 0.8759, batch_reg_loss: 0.1287, reg_loss: 0.1279 ||:  77%|#######6  | 85/111 [00:57<00:18,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8220, UAS: 0.9270, LAS: 0.8697, UEM: 0.5177, LEM: 0.2879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3218, partial_loss/deprel_loss: 1.0454, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2295, loss: 0.8849, batch_reg_loss: 0.1288, reg_loss: 0.1279 ||:  79%|#######9  | 88/111 [00:59<00:17,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8171, UAS: 0.9260, LAS: 0.8684, UEM: 0.5104, LEM: 0.2823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4441, partial_loss/deprel_loss: 1.2558, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4223, loss: 0.8980, batch_reg_loss: 0.1288, reg_loss: 0.1279 ||:  83%|########2 | 92/111 [01:02<00:13,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9262, LAS: 0.8686, UEM: 0.5193, LEM: 0.2901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3134, partial_loss/deprel_loss: 0.4586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5585, loss: 0.8958, batch_reg_loss: 0.1289, reg_loss: 0.1280 ||:  86%|########5 | 95/111 [01:04<00:11,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9256, LAS: 0.8679, UEM: 0.5131, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8674, partial_loss/deprel_loss: 0.8091, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9497, loss: 0.9019, batch_reg_loss: 0.1290, reg_loss: 0.1280 ||:  88%|########8 | 98/111 [01:06<00:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9268, LAS: 0.8692, UEM: 0.5273, LEM: 0.2957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3296, partial_loss/deprel_loss: 0.4673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5688, loss: 0.8912, batch_reg_loss: 0.1290, reg_loss: 0.1280 ||:  91%|######### | 101/111 [01:08<00:07,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8077, UAS: 0.9265, LAS: 0.8689, UEM: 0.5272, LEM: 0.2951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5767, partial_loss/deprel_loss: 1.2628, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4546, loss: 0.8940, batch_reg_loss: 0.1291, reg_loss: 0.1281 ||:  94%|#########3| 104/111 [01:11<00:05,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9270, LAS: 0.8692, UEM: 0.5252, LEM: 0.2916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9199, partial_loss/deprel_loss: 0.9289, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0563, loss: 0.8924, batch_reg_loss: 0.1292, reg_loss: 0.1281 ||:  97%|#########7| 108/111 [01:13<00:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9271, LAS: 0.8694, UEM: 0.5212, LEM: 0.2884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5733, partial_loss/deprel_loss: 0.6382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7544, loss: 0.8907, batch_reg_loss: 0.1292, reg_loss: 0.1281 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-06 23:37:04,098 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8198, UAS: 0.9346, LAS: 0.8832, UEM: 0.6393, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6542, partial_loss/deprel_loss: 60.5480, partial_loss/cycle_loss: 0.0000, batch_loss: 48.7692, loss: 28.2319, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:03<00:10,  1.05s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9413, LAS: 0.8902, UEM: 0.6892, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7597, partial_loss/deprel_loss: 30.7479, partial_loss/cycle_loss: 0.0000, batch_loss: 24.7503, loss: 26.1370, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:07,  1.02s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9004, UAS: 0.9440, LAS: 0.8904, UEM: 0.6567, LEM: 0.3837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4145, partial_loss/deprel_loss: 24.9592, partial_loss/cycle_loss: 0.0000, batch_loss: 20.0503, loss: 25.0336, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9429, LAS: 0.8893, UEM: 0.6474, LEM: 0.3799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0086, partial_loss/deprel_loss: 44.8982, partial_loss/cycle_loss: 0.0000, batch_loss: 36.1203, loss: 26.7810, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9419, LAS: 0.8881, UEM: 0.6314, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8470, partial_loss/deprel_loss: 31.8272, partial_loss/cycle_loss: 0.0000, batch_loss: 25.6312, loss: 26.6926, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.05it/s]\n",
+      "2023-04-06 23:37:16,466 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.638  |    31.827\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.573  |     0.847\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.128  |     0.000\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - UEM                      |     0.521  |     0.631\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - LAS                      |     0.869  |     0.888\n",
+      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - loss                     |     0.891  |    26.693\n",
+      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - LEM                      |     0.288  |     0.366\n",
+      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - UAS                      |     0.927  |     0.942\n",
+      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - EM                       |     0.877  |     0.874\n",
+      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:37:16,469 - INFO - combo.training.trainer - Epoch duration: 0:01:28.057300\n",
+      "2023-04-06 23:37:16,469 - INFO - combo.training.trainer - Estimated training time remaining: 8:00:08\n",
+      "2023-04-06 23:37:16,469 - INFO - allennlp.training.trainer - Epoch 36/399\n",
+      "2023-04-06 23:37:16,469 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:37:16,469 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-06 23:37:16,477 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9452, LAS: 0.8924, UEM: 0.5289, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4880, partial_loss/deprel_loss: 0.6698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7627, loss: 0.7053, batch_reg_loss: 0.1293, reg_loss: 0.1293 ||:   3%|2         | 3/111 [00:02<01:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7919, UAS: 0.9146, LAS: 0.8533, UEM: 0.4009, LEM: 0.1795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6848, partial_loss/deprel_loss: 1.3093, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5138, loss: 1.0154, batch_reg_loss: 0.1294, reg_loss: 0.1293 ||:   6%|6         | 7/111 [00:04<01:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9211, LAS: 0.8604, UEM: 0.4206, LEM: 0.1742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4597, partial_loss/deprel_loss: 0.6605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7498, loss: 0.9638, batch_reg_loss: 0.1294, reg_loss: 0.1293 ||:   9%|9         | 10/111 [00:06<01:09,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9129, LAS: 0.8526, UEM: 0.3770, LEM: 0.1513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8000, partial_loss/deprel_loss: 0.7861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9183, loss: 1.0215, batch_reg_loss: 0.1295, reg_loss: 0.1294 ||:  12%|#1        | 13/111 [00:08<01:07,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9189, LAS: 0.8602, UEM: 0.3997, LEM: 0.1637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4654, partial_loss/deprel_loss: 0.6501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7427, loss: 0.9621, batch_reg_loss: 0.1295, reg_loss: 0.1294 ||:  14%|#4        | 16/111 [00:11<01:08,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8315, UAS: 0.9139, LAS: 0.8544, UEM: 0.3725, LEM: 0.1497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0556, partial_loss/deprel_loss: 1.0156, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1532, loss: 1.0103, batch_reg_loss: 0.1296, reg_loss: 0.1294 ||:  17%|#7        | 19/111 [00:13<01:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9164, LAS: 0.8573, UEM: 0.4090, LEM: 0.1805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3374, partial_loss/deprel_loss: 0.4859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.9840, batch_reg_loss: 0.1296, reg_loss: 0.1294 ||:  20%|#9        | 22/111 [00:15<01:03,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9540, UAS: 0.9206, LAS: 0.8620, UEM: 0.5124, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0660, partial_loss/deprel_loss: 0.1975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3009, loss: 0.9505, batch_reg_loss: 0.1297, reg_loss: 0.1295 ||:  23%|##2       | 25/111 [00:17<01:05,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8453, UAS: 0.9192, LAS: 0.8603, UEM: 0.4831, LEM: 0.2796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0821, partial_loss/deprel_loss: 0.8557, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0308, loss: 0.9618, batch_reg_loss: 0.1298, reg_loss: 0.1295 ||:  26%|##6       | 29/111 [00:20<00:58,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9221, LAS: 0.8634, UEM: 0.5052, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1437, partial_loss/deprel_loss: 0.3982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4772, loss: 0.9353, batch_reg_loss: 0.1299, reg_loss: 0.1295 ||:  29%|##8       | 32/111 [00:22<00:56,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8467, UAS: 0.9198, LAS: 0.8611, UEM: 0.4829, LEM: 0.2747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1443, partial_loss/deprel_loss: 0.8956, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0753, loss: 0.9539, batch_reg_loss: 0.1299, reg_loss: 0.1296 ||:  32%|###2      | 36/111 [00:25<00:52,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8848, UAS: 0.9206, LAS: 0.8620, UEM: 0.4807, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6102, partial_loss/deprel_loss: 0.6688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7871, loss: 0.9482, batch_reg_loss: 0.1300, reg_loss: 0.1296 ||:  35%|###5      | 39/111 [00:27<00:50,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8373, UAS: 0.9212, LAS: 0.8630, UEM: 0.4812, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1409, partial_loss/deprel_loss: 1.0084, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1650, loss: 0.9400, batch_reg_loss: 0.1301, reg_loss: 0.1297 ||:  39%|###8      | 43/111 [00:29<00:46,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9227, LAS: 0.8648, UEM: 0.4976, LEM: 0.2776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2244, partial_loss/deprel_loss: 0.4163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5081, loss: 0.9244, batch_reg_loss: 0.1302, reg_loss: 0.1297 ||:  42%|####2     | 47/111 [00:32<00:42,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9247, LAS: 0.8669, UEM: 0.5112, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2245, partial_loss/deprel_loss: 0.4146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5068, loss: 0.9069, batch_reg_loss: 0.1302, reg_loss: 0.1297 ||:  45%|####5     | 50/111 [00:34<00:41,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9256, LAS: 0.8678, UEM: 0.5218, LEM: 0.2915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9718, partial_loss/deprel_loss: 0.9520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0862, loss: 0.8975, batch_reg_loss: 0.1303, reg_loss: 0.1298 ||:  48%|####7     | 53/111 [00:36<00:41,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9273, LAS: 0.8700, UEM: 0.5428, LEM: 0.3133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5033, partial_loss/deprel_loss: 0.6351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7391, loss: 0.8805, batch_reg_loss: 0.1304, reg_loss: 0.1298 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9283, LAS: 0.8711, UEM: 0.5485, LEM: 0.3151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4286, partial_loss/deprel_loss: 0.5783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6788, loss: 0.8710, batch_reg_loss: 0.1304, reg_loss: 0.1298 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9295, LAS: 0.8725, UEM: 0.5627, LEM: 0.3281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3033, partial_loss/deprel_loss: 0.4829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5775, loss: 0.8593, batch_reg_loss: 0.1305, reg_loss: 0.1299 ||:  57%|#####6    | 63/111 [00:43<00:34,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9297, LAS: 0.8727, UEM: 0.5516, LEM: 0.3177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5741, partial_loss/deprel_loss: 0.7504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8456, loss: 0.8591, batch_reg_loss: 0.1305, reg_loss: 0.1299 ||:  60%|######    | 67/111 [00:46<00:30,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9298, LAS: 0.8726, UEM: 0.5457, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1037, partial_loss/deprel_loss: 0.9766, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1326, loss: 0.8598, batch_reg_loss: 0.1306, reg_loss: 0.1299 ||:  64%|######3   | 71/111 [00:48<00:27,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9304, LAS: 0.8730, UEM: 0.5460, LEM: 0.3102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3699, partial_loss/deprel_loss: 0.5524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6465, loss: 0.8557, batch_reg_loss: 0.1306, reg_loss: 0.1300 ||:  68%|######7   | 75/111 [00:51<00:23,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9292, LAS: 0.8716, UEM: 0.5398, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4855, partial_loss/deprel_loss: 1.0485, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2665, loss: 0.8661, batch_reg_loss: 0.1307, reg_loss: 0.1300 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9298, LAS: 0.8723, UEM: 0.5468, LEM: 0.3095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4292, partial_loss/deprel_loss: 0.6107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7051, loss: 0.8599, batch_reg_loss: 0.1307, reg_loss: 0.1300 ||:  75%|#######4  | 83/111 [00:57<00:19,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9290, LAS: 0.8713, UEM: 0.5385, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5060, partial_loss/deprel_loss: 0.6993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7915, loss: 0.8692, batch_reg_loss: 0.1308, reg_loss: 0.1301 ||:  78%|#######8  | 87/111 [00:59<00:15,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9280, LAS: 0.8700, UEM: 0.5342, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7672, partial_loss/deprel_loss: 0.9964, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0814, loss: 0.8801, batch_reg_loss: 0.1309, reg_loss: 0.1301 ||:  82%|########1 | 91/111 [01:01<00:12,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9272, LAS: 0.8690, UEM: 0.5320, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2635, partial_loss/deprel_loss: 0.4135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.8877, batch_reg_loss: 0.1310, reg_loss: 0.1301 ||:  86%|########5 | 95/111 [01:04<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9272, LAS: 0.8689, UEM: 0.5316, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3234, partial_loss/deprel_loss: 0.5304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6200, loss: 0.8883, batch_reg_loss: 0.1310, reg_loss: 0.1302 ||:  88%|########8 | 98/111 [01:07<00:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9277, LAS: 0.8693, UEM: 0.5311, LEM: 0.2932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3735, partial_loss/deprel_loss: 0.6150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6978, loss: 0.8848, batch_reg_loss: 0.1311, reg_loss: 0.1302 ||:  92%|#########1| 102/111 [01:09<00:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8988, UAS: 0.9277, LAS: 0.8695, UEM: 0.5285, LEM: 0.2901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4234, partial_loss/deprel_loss: 0.5900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.8845, batch_reg_loss: 0.1312, reg_loss: 0.1302 ||:  95%|#########5| 106/111 [01:12<00:03,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9270, LAS: 0.8688, UEM: 0.5260, LEM: 0.2884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2633, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5303, loss: 0.8900, batch_reg_loss: 0.1313, reg_loss: 0.1303 ||:  99%|#########9| 110/111 [01:15<00:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9271, LAS: 0.8689, UEM: 0.5252, LEM: 0.2873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5826, partial_loss/deprel_loss: 0.7173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8217, loss: 0.8894, batch_reg_loss: 0.1313, reg_loss: 0.1303 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.717  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.583  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.130  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - UEM                      |     0.525  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - LAS                      |     0.869  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - loss                     |     0.889  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - LEM                      |     0.287  |       N/A\n",
+      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - UAS                      |     0.927  |       N/A\n",
+      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - EM                       |     0.874  |       N/A\n",
+      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:38:32,179 - INFO - combo.training.trainer - Epoch duration: 0:01:15.709732\n",
+      "2023-04-06 23:38:32,179 - INFO - combo.training.trainer - Estimated training time remaining: 7:58:15\n",
+      "2023-04-06 23:38:32,179 - INFO - allennlp.training.trainer - Epoch 37/399\n",
+      "2023-04-06 23:38:32,179 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:38:32,179 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:38:32,188 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9332, LAS: 0.8765, UEM: 0.4678, LEM: 0.2122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3651, partial_loss/deprel_loss: 0.4818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5898, loss: 0.8393, batch_reg_loss: 0.1314, reg_loss: 0.1314 ||:   4%|3         | 4/111 [00:02<01:08,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9418, LAS: 0.8880, UEM: 0.6776, LEM: 0.4819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5287, partial_loss/deprel_loss: 0.6488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7562, loss: 0.7479, batch_reg_loss: 0.1315, reg_loss: 0.1314 ||:   6%|6         | 7/111 [00:05<01:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9401, LAS: 0.8861, UEM: 0.6351, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3285, partial_loss/deprel_loss: 0.5358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6258, loss: 0.7604, batch_reg_loss: 0.1315, reg_loss: 0.1314 ||:   9%|9         | 10/111 [00:07<01:09,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9390, LAS: 0.8841, UEM: 0.5888, LEM: 0.3604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3963, partial_loss/deprel_loss: 0.5860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6797, loss: 0.7824, batch_reg_loss: 0.1316, reg_loss: 0.1315 ||:  13%|#2        | 14/111 [00:09<01:03,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8355, UAS: 0.9365, LAS: 0.8814, UEM: 0.5696, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2521, partial_loss/deprel_loss: 0.9936, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1770, loss: 0.8040, batch_reg_loss: 0.1316, reg_loss: 0.1315 ||:  15%|#5        | 17/111 [00:11<01:03,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8802, UAS: 0.9375, LAS: 0.8818, UEM: 0.5544, LEM: 0.3182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5666, partial_loss/deprel_loss: 0.7057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8096, loss: 0.7999, batch_reg_loss: 0.1317, reg_loss: 0.1315 ||:  18%|#8        | 20/111 [00:13<01:01,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9373, LAS: 0.8809, UEM: 0.5360, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6051, partial_loss/deprel_loss: 0.7038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8158, loss: 0.8015, batch_reg_loss: 0.1317, reg_loss: 0.1315 ||:  21%|##        | 23/111 [00:15<00:59,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9358, LAS: 0.8789, UEM: 0.5296, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3506, partial_loss/deprel_loss: 0.5437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6369, loss: 0.8139, batch_reg_loss: 0.1318, reg_loss: 0.1316 ||:  24%|##4       | 27/111 [00:18<00:56,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9368, LAS: 0.8799, UEM: 0.5409, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2640, partial_loss/deprel_loss: 0.4096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.8028, batch_reg_loss: 0.1319, reg_loss: 0.1316 ||:  28%|##7       | 31/111 [00:20<00:52,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7975, UAS: 0.9310, LAS: 0.8739, UEM: 0.5321, LEM: 0.2887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7992, partial_loss/deprel_loss: 1.2460, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4886, loss: 0.8534, batch_reg_loss: 0.1319, reg_loss: 0.1316 ||:  31%|###       | 34/111 [00:23<00:53,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9295, LAS: 0.8724, UEM: 0.5293, LEM: 0.2876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5793, partial_loss/deprel_loss: 0.6494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7674, loss: 0.8636, batch_reg_loss: 0.1320, reg_loss: 0.1317 ||:  34%|###4      | 38/111 [00:25<00:49,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9291, LAS: 0.8717, UEM: 0.5239, LEM: 0.2817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7996, partial_loss/deprel_loss: 0.7570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8976, loss: 0.8671, batch_reg_loss: 0.1321, reg_loss: 0.1317 ||:  37%|###6      | 41/111 [00:27<00:48,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9284, LAS: 0.8710, UEM: 0.5212, LEM: 0.2801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8072, partial_loss/deprel_loss: 0.7757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9141, loss: 0.8724, batch_reg_loss: 0.1321, reg_loss: 0.1317 ||:  40%|###9      | 44/111 [00:30<00:47,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9267, LAS: 0.8691, UEM: 0.5128, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3557, partial_loss/deprel_loss: 0.5814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6685, loss: 0.8894, batch_reg_loss: 0.1322, reg_loss: 0.1318 ||:  42%|####2     | 47/111 [00:32<00:45,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9279, LAS: 0.8706, UEM: 0.5283, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2007, partial_loss/deprel_loss: 0.3160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4252, loss: 0.8751, batch_reg_loss: 0.1323, reg_loss: 0.1318 ||:  46%|####5     | 51/111 [00:35<00:42,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9263, LAS: 0.8688, UEM: 0.5287, LEM: 0.2919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2684, partial_loss/deprel_loss: 0.4409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5387, loss: 0.8898, batch_reg_loss: 0.1323, reg_loss: 0.1318 ||:  49%|####8     | 54/111 [00:37<00:41,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8261, UAS: 0.9249, LAS: 0.8676, UEM: 0.5162, LEM: 0.2841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4259, partial_loss/deprel_loss: 0.9915, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2108, loss: 0.8998, batch_reg_loss: 0.1324, reg_loss: 0.1319 ||:  51%|#####1    | 57/111 [00:39<00:38,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9245, LAS: 0.8671, UEM: 0.5301, LEM: 0.3042, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1480, partial_loss/deprel_loss: 0.2760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3828, loss: 0.9042, batch_reg_loss: 0.1325, reg_loss: 0.1319 ||:  54%|#####4    | 60/111 [00:41<00:36,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8584, UAS: 0.9240, LAS: 0.8665, UEM: 0.5210, LEM: 0.2975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8904, partial_loss/deprel_loss: 0.8210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9674, loss: 0.9083, batch_reg_loss: 0.1325, reg_loss: 0.1319 ||:  57%|#####6    | 63/111 [00:43<00:34,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9239, LAS: 0.8662, UEM: 0.5185, LEM: 0.2949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3084, partial_loss/deprel_loss: 0.5285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6171, loss: 0.9107, batch_reg_loss: 0.1326, reg_loss: 0.1319 ||:  59%|#####9    | 66/111 [00:45<00:31,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9242, LAS: 0.8665, UEM: 0.5151, LEM: 0.2909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3071, partial_loss/deprel_loss: 0.4553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5583, loss: 0.9102, batch_reg_loss: 0.1327, reg_loss: 0.1320 ||:  63%|######3   | 70/111 [00:48<00:28,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8097, UAS: 0.9240, LAS: 0.8662, UEM: 0.5102, LEM: 0.2864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4604, partial_loss/deprel_loss: 1.2037, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3878, loss: 0.9143, batch_reg_loss: 0.1327, reg_loss: 0.1320 ||:  67%|######6   | 74/111 [00:50<00:24,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9252, LAS: 0.8674, UEM: 0.5201, LEM: 0.2896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4208, partial_loss/deprel_loss: 0.6707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7536, loss: 0.9017, batch_reg_loss: 0.1328, reg_loss: 0.1321 ||:  70%|#######   | 78/111 [00:53<00:22,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.9250, LAS: 0.8668, UEM: 0.5147, LEM: 0.2835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4345, partial_loss/deprel_loss: 0.6903, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7721, loss: 0.9045, batch_reg_loss: 0.1329, reg_loss: 0.1321 ||:  74%|#######3  | 82/111 [00:55<00:18,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9257, LAS: 0.8676, UEM: 0.5136, LEM: 0.2802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7814, partial_loss/deprel_loss: 0.6975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8472, loss: 0.8976, batch_reg_loss: 0.1330, reg_loss: 0.1321 ||:  77%|#######7  | 86/111 [00:58<00:16,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8497, UAS: 0.9262, LAS: 0.8681, UEM: 0.5186, LEM: 0.2849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9150, partial_loss/deprel_loss: 0.9404, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0683, loss: 0.8935, batch_reg_loss: 0.1331, reg_loss: 0.1322 ||:  81%|########1 | 90/111 [01:00<00:13,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8307, UAS: 0.9267, LAS: 0.8686, UEM: 0.5241, LEM: 0.2879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1581, partial_loss/deprel_loss: 0.9771, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1465, loss: 0.8894, batch_reg_loss: 0.1331, reg_loss: 0.1322 ||:  85%|########4 | 94/111 [01:03<00:10,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9258, LAS: 0.8677, UEM: 0.5219, LEM: 0.2883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0681, partial_loss/deprel_loss: 1.0203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1631, loss: 0.8979, batch_reg_loss: 0.1332, reg_loss: 0.1323 ||:  88%|########8 | 98/111 [01:06<00:08,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9266, LAS: 0.8686, UEM: 0.5311, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3334, partial_loss/deprel_loss: 0.4944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5954, loss: 0.8899, batch_reg_loss: 0.1333, reg_loss: 0.1323 ||:  92%|#########1| 102/111 [01:09<00:06,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9265, LAS: 0.8684, UEM: 0.5272, LEM: 0.2905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4459, partial_loss/deprel_loss: 0.6718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7599, loss: 0.8925, batch_reg_loss: 0.1333, reg_loss: 0.1323 ||:  95%|#########4| 105/111 [01:11<00:04,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9261, LAS: 0.8679, UEM: 0.5228, LEM: 0.2874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5106, partial_loss/deprel_loss: 0.6320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7411, loss: 0.8953, batch_reg_loss: 0.1334, reg_loss: 0.1324 ||:  97%|#########7| 108/111 [01:13<00:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9265, LAS: 0.8684, UEM: 0.5222, LEM: 0.2859, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5453, partial_loss/deprel_loss: 0.6499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7624, loss: 0.8914, batch_reg_loss: 0.1334, reg_loss: 0.1324 ||: 100%|##########| 111/111 [01:15<00:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9265, LAS: 0.8684, UEM: 0.5222, LEM: 0.2859, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5453, partial_loss/deprel_loss: 0.6499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7624, loss: 0.8914, batch_reg_loss: 0.1334, reg_loss: 0.1324 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
+      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.650  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.545  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.132  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - UEM                      |     0.522  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - LAS                      |     0.868  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - loss                     |     0.891  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - LEM                      |     0.286  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - UAS                      |     0.926  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - EM                       |     0.894  |       N/A\n",
+      "2023-04-06 23:39:48,044 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:39:48,044 - INFO - combo.training.trainer - Epoch duration: 0:01:15.865530\n",
+      "2023-04-06 23:39:48,045 - INFO - combo.training.trainer - Estimated training time remaining: 7:56:25\n",
+      "2023-04-06 23:39:48,045 - INFO - allennlp.training.trainer - Epoch 38/399\n",
+      "2023-04-06 23:39:48,045 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:39:48,045 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:39:48,052 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9161, LAS: 0.8534, UEM: 0.1467, LEM: 0.0433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0036, partial_loss/deprel_loss: 0.8636, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0250, loss: 0.9915, batch_reg_loss: 0.1335, reg_loss: 0.1335 ||:   3%|2         | 3/111 [00:02<01:16,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8142, UAS: 0.9123, LAS: 0.8513, UEM: 0.1802, LEM: 0.0496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5122, partial_loss/deprel_loss: 1.1313, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3410, loss: 1.0190, batch_reg_loss: 0.1335, reg_loss: 0.1335 ||:   5%|5         | 6/111 [00:04<01:13,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9073, LAS: 0.8475, UEM: 0.2964, LEM: 0.1575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3239, partial_loss/deprel_loss: 0.4766, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 1.0513, batch_reg_loss: 0.1336, reg_loss: 0.1335 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9198, LAS: 0.8619, UEM: 0.4844, LEM: 0.2866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5275, partial_loss/deprel_loss: 0.6271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7409, loss: 0.9421, batch_reg_loss: 0.1337, reg_loss: 0.1336 ||:  13%|#2        | 14/111 [00:09<01:04,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9218, LAS: 0.8642, UEM: 0.4745, LEM: 0.2762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3876, partial_loss/deprel_loss: 0.4967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6086, loss: 0.9359, batch_reg_loss: 0.1338, reg_loss: 0.1336 ||:  15%|#5        | 17/111 [00:11<01:02,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9248, LAS: 0.8685, UEM: 0.4811, LEM: 0.2716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4559, partial_loss/deprel_loss: 0.6083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7117, loss: 0.9002, batch_reg_loss: 0.1338, reg_loss: 0.1336 ||:  19%|#8        | 21/111 [00:13<00:59,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9240, LAS: 0.8676, UEM: 0.4905, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5441, partial_loss/deprel_loss: 0.6274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7447, loss: 0.9093, batch_reg_loss: 0.1339, reg_loss: 0.1337 ||:  22%|##1       | 24/111 [00:16<01:00,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9241, LAS: 0.8673, UEM: 0.4942, LEM: 0.2837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0271, partial_loss/deprel_loss: 0.9570, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.9047, batch_reg_loss: 0.1340, reg_loss: 0.1337 ||:  24%|##4       | 27/111 [00:18<00:59,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9236, LAS: 0.8662, UEM: 0.4872, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3372, partial_loss/deprel_loss: 0.5897, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6733, loss: 0.9112, batch_reg_loss: 0.1340, reg_loss: 0.1337 ||:  27%|##7       | 30/111 [00:20<00:58,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9250, LAS: 0.8682, UEM: 0.5068, LEM: 0.2874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3059, partial_loss/deprel_loss: 0.4710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5721, loss: 0.8960, batch_reg_loss: 0.1341, reg_loss: 0.1338 ||:  30%|##9       | 33/111 [00:22<00:55,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7594, UAS: 0.9238, LAS: 0.8673, UEM: 0.5198, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6236, partial_loss/deprel_loss: 1.6358, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9675, loss: 0.9092, batch_reg_loss: 0.1341, reg_loss: 0.1338 ||:  32%|###2      | 36/111 [00:25<00:56,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8449, UAS: 0.9248, LAS: 0.8688, UEM: 0.5415, LEM: 0.3280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0372, partial_loss/deprel_loss: 0.9183, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0763, loss: 0.8961, batch_reg_loss: 0.1342, reg_loss: 0.1338 ||:  35%|###5      | 39/111 [00:27<00:53,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9254, LAS: 0.8697, UEM: 0.5361, LEM: 0.3217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3875, partial_loss/deprel_loss: 0.4584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5785, loss: 0.8888, batch_reg_loss: 0.1343, reg_loss: 0.1338 ||:  38%|###7      | 42/111 [00:29<00:51,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9276, LAS: 0.8721, UEM: 0.5593, LEM: 0.3361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1639, partial_loss/deprel_loss: 0.4386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5180, loss: 0.8677, batch_reg_loss: 0.1343, reg_loss: 0.1339 ||:  41%|####1     | 46/111 [00:32<00:46,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9286, LAS: 0.8729, UEM: 0.5516, LEM: 0.3245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4020, partial_loss/deprel_loss: 0.5790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6780, loss: 0.8602, batch_reg_loss: 0.1344, reg_loss: 0.1339 ||:  45%|####5     | 50/111 [00:34<00:42,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8677, UAS: 0.9283, LAS: 0.8724, UEM: 0.5407, LEM: 0.3145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7025, partial_loss/deprel_loss: 0.8024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9169, loss: 0.8647, batch_reg_loss: 0.1345, reg_loss: 0.1340 ||:  48%|####7     | 53/111 [00:37<00:42,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9300, LAS: 0.8742, UEM: 0.5445, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3832, partial_loss/deprel_loss: 0.6491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7305, loss: 0.8520, batch_reg_loss: 0.1345, reg_loss: 0.1340 ||:  51%|#####1    | 57/111 [00:39<00:38,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9292, LAS: 0.8732, UEM: 0.5361, LEM: 0.3047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0990, partial_loss/deprel_loss: 0.9602, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1226, loss: 0.8597, batch_reg_loss: 0.1346, reg_loss: 0.1340 ||:  55%|#####4    | 61/111 [00:42<00:34,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9296, LAS: 0.8736, UEM: 0.5367, LEM: 0.3039, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4994, partial_loss/deprel_loss: 0.5723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6924, loss: 0.8544, batch_reg_loss: 0.1346, reg_loss: 0.1341 ||:  58%|#####7    | 64/111 [00:44<00:33,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7939, UAS: 0.9282, LAS: 0.8718, UEM: 0.5287, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7784, partial_loss/deprel_loss: 1.2841, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5176, loss: 0.8678, batch_reg_loss: 0.1347, reg_loss: 0.1341 ||:  60%|######    | 67/111 [00:46<00:30,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8464, UAS: 0.9276, LAS: 0.8711, UEM: 0.5219, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9674, partial_loss/deprel_loss: 0.8496, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0079, loss: 0.8726, batch_reg_loss: 0.1347, reg_loss: 0.1341 ||:  63%|######3   | 70/111 [00:48<00:29,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9280, LAS: 0.8714, UEM: 0.5153, LEM: 0.2841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4529, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7153, loss: 0.8731, batch_reg_loss: 0.1348, reg_loss: 0.1341 ||:  67%|######6   | 74/111 [00:51<00:24,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8183, UAS: 0.9288, LAS: 0.8724, UEM: 0.5400, LEM: 0.3144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4612, partial_loss/deprel_loss: 1.1146, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3188, loss: 0.8662, batch_reg_loss: 0.1349, reg_loss: 0.1342 ||:  70%|#######   | 78/111 [00:54<00:23,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9283, LAS: 0.8717, UEM: 0.5372, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3601, partial_loss/deprel_loss: 0.5822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6727, loss: 0.8713, batch_reg_loss: 0.1349, reg_loss: 0.1342 ||:  73%|#######2  | 81/111 [00:56<00:21,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9280, LAS: 0.8713, UEM: 0.5341, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5286, partial_loss/deprel_loss: 0.6541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7640, loss: 0.8738, batch_reg_loss: 0.1350, reg_loss: 0.1342 ||:  76%|#######5  | 84/111 [00:58<00:18,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9284, LAS: 0.8716, UEM: 0.5292, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6210, partial_loss/deprel_loss: 0.6848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8071, loss: 0.8722, batch_reg_loss: 0.1351, reg_loss: 0.1343 ||:  79%|#######9  | 88/111 [01:01<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8379, UAS: 0.9283, LAS: 0.8715, UEM: 0.5263, LEM: 0.3003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2265, partial_loss/deprel_loss: 0.9465, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1377, loss: 0.8723, batch_reg_loss: 0.1352, reg_loss: 0.1343 ||:  83%|########2 | 92/111 [01:03<00:12,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9284, LAS: 0.8716, UEM: 0.5317, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3219, partial_loss/deprel_loss: 0.5873, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6694, loss: 0.8716, batch_reg_loss: 0.1352, reg_loss: 0.1343 ||:  86%|########6 | 96/111 [01:06<00:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7974, UAS: 0.9280, LAS: 0.8711, UEM: 0.5262, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6483, partial_loss/deprel_loss: 1.2148, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4368, loss: 0.8753, batch_reg_loss: 0.1353, reg_loss: 0.1344 ||:  90%|######### | 100/111 [01:09<00:07,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8199, UAS: 0.9261, LAS: 0.8692, UEM: 0.5205, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4797, partial_loss/deprel_loss: 1.0433, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2660, loss: 0.8891, batch_reg_loss: 0.1354, reg_loss: 0.1344 ||:  93%|#########2| 103/111 [01:11<00:05,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8481, UAS: 0.9259, LAS: 0.8689, UEM: 0.5149, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9886, partial_loss/deprel_loss: 0.9805, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1176, loss: 0.8923, batch_reg_loss: 0.1354, reg_loss: 0.1345 ||:  96%|#########6| 107/111 [01:14<00:02,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9264, LAS: 0.8696, UEM: 0.5161, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2614, partial_loss/deprel_loss: 0.4928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5820, loss: 0.8875, batch_reg_loss: 0.1355, reg_loss: 0.1345 ||: 100%|##########| 111/111 [01:16<00:00,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9264, LAS: 0.8696, UEM: 0.5161, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2614, partial_loss/deprel_loss: 0.4928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5820, loss: 0.8875, batch_reg_loss: 0.1355, reg_loss: 0.1345 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.493  |       N/A\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.261  |       N/A\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.134  |       N/A\n",
+      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - UEM                      |     0.516  |       N/A\n",
+      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - LAS                      |     0.870  |       N/A\n",
+      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - loss                     |     0.888  |       N/A\n",
+      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - LEM                      |     0.291  |       N/A\n",
+      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - UAS                      |     0.926  |       N/A\n",
+      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - EM                       |     0.911  |       N/A\n",
+      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:41:04,482 - INFO - combo.training.trainer - Epoch duration: 0:01:16.437091\n",
+      "2023-04-06 23:41:04,482 - INFO - combo.training.trainer - Estimated training time remaining: 7:54:43\n",
+      "2023-04-06 23:41:04,482 - INFO - allennlp.training.trainer - Epoch 39/399\n",
+      "2023-04-06 23:41:04,482 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:41:04,482 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:41:04,489 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9271, LAS: 0.8726, UEM: 0.3130, LEM: 0.1275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7463, partial_loss/deprel_loss: 0.7432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8794, loss: 0.8727, batch_reg_loss: 0.1356, reg_loss: 0.1356 ||:   3%|2         | 3/111 [00:02<01:26,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9318, LAS: 0.8801, UEM: 0.6530, LEM: 0.5221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8199, partial_loss/deprel_loss: 0.7412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8926, loss: 0.8137, batch_reg_loss: 0.1357, reg_loss: 0.1356 ||:   5%|5         | 6/111 [00:04<01:23,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9279, LAS: 0.8751, UEM: 0.6365, LEM: 0.4647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4726, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6784, loss: 0.8520, batch_reg_loss: 0.1357, reg_loss: 0.1356 ||:   8%|8         | 9/111 [00:07<01:20,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9365, LAS: 0.8843, UEM: 0.6833, LEM: 0.4764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1591, partial_loss/deprel_loss: 0.3740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4668, loss: 0.7746, batch_reg_loss: 0.1358, reg_loss: 0.1357 ||:  11%|#         | 12/111 [00:09<01:17,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9311, LAS: 0.8782, UEM: 0.6278, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4972, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6593, loss: 0.8231, batch_reg_loss: 0.1358, reg_loss: 0.1357 ||:  14%|#4        | 16/111 [00:11<01:08,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9309, LAS: 0.8773, UEM: 0.5934, LEM: 0.3878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9564, partial_loss/deprel_loss: 0.8364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9963, loss: 0.8333, batch_reg_loss: 0.1359, reg_loss: 0.1357 ||:  17%|#7        | 19/111 [00:14<01:07,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9315, LAS: 0.8780, UEM: 0.6091, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1309, partial_loss/deprel_loss: 0.2656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3746, loss: 0.8262, batch_reg_loss: 0.1360, reg_loss: 0.1358 ||:  20%|#9        | 22/111 [00:16<01:05,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9291, LAS: 0.8751, UEM: 0.5884, LEM: 0.3928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4094, partial_loss/deprel_loss: 0.5780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6803, loss: 0.8458, batch_reg_loss: 0.1360, reg_loss: 0.1358 ||:  23%|##2       | 25/111 [00:18<01:03,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9310, LAS: 0.8771, UEM: 0.5775, LEM: 0.3731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4881, partial_loss/deprel_loss: 0.6655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7661, loss: 0.8331, batch_reg_loss: 0.1361, reg_loss: 0.1358 ||:  25%|##5       | 28/111 [00:20<00:59,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9315, LAS: 0.8775, UEM: 0.5766, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3092, partial_loss/deprel_loss: 0.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5658, loss: 0.8266, batch_reg_loss: 0.1361, reg_loss: 0.1358 ||:  28%|##7       | 31/111 [00:23<01:02,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9334, LAS: 0.8794, UEM: 0.5744, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4142, partial_loss/deprel_loss: 0.5945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6946, loss: 0.8153, batch_reg_loss: 0.1362, reg_loss: 0.1359 ||:  32%|###1      | 35/111 [00:25<00:56,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9338, LAS: 0.8798, UEM: 0.5824, LEM: 0.3585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1928, partial_loss/deprel_loss: 0.3426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4489, loss: 0.8117, batch_reg_loss: 0.1363, reg_loss: 0.1359 ||:  35%|###5      | 39/111 [00:28<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9350, LAS: 0.8810, UEM: 0.5892, LEM: 0.3634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3795, partial_loss/deprel_loss: 0.5966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6895, loss: 0.8028, batch_reg_loss: 0.1363, reg_loss: 0.1360 ||:  39%|###8      | 43/111 [00:30<00:45,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9368, LAS: 0.8829, UEM: 0.5965, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.4359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5324, loss: 0.7887, batch_reg_loss: 0.1364, reg_loss: 0.1360 ||:  42%|####2     | 47/111 [00:32<00:40,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8263, UAS: 0.9351, LAS: 0.8808, UEM: 0.5802, LEM: 0.3496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2804, partial_loss/deprel_loss: 1.0114, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2017, loss: 0.8047, batch_reg_loss: 0.1365, reg_loss: 0.1360 ||:  46%|####5     | 51/111 [00:35<00:38,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7825, UAS: 0.9341, LAS: 0.8795, UEM: 0.5765, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8381, partial_loss/deprel_loss: 1.2425, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4981, loss: 0.8138, batch_reg_loss: 0.1365, reg_loss: 0.1361 ||:  50%|####9     | 55/111 [00:38<00:38,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9343, LAS: 0.8798, UEM: 0.5758, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2422, partial_loss/deprel_loss: 0.3801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4891, loss: 0.8124, batch_reg_loss: 0.1366, reg_loss: 0.1361 ||:  52%|#####2    | 58/111 [00:40<00:36,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9338, LAS: 0.8791, UEM: 0.5644, LEM: 0.3330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5629, partial_loss/deprel_loss: 0.6541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7725, loss: 0.8162, batch_reg_loss: 0.1366, reg_loss: 0.1361 ||:  56%|#####5    | 62/111 [00:42<00:31,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8466, UAS: 0.9340, LAS: 0.8790, UEM: 0.5651, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0235, partial_loss/deprel_loss: 0.9341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0887, loss: 0.8163, batch_reg_loss: 0.1367, reg_loss: 0.1362 ||:  59%|#####9    | 66/111 [00:45<00:28,  1.61it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8475, UAS: 0.9333, LAS: 0.8778, UEM: 0.5585, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8708, partial_loss/deprel_loss: 1.0278, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1332, loss: 0.8263, batch_reg_loss: 0.1368, reg_loss: 0.1362 ||:  63%|######3   | 70/111 [00:48<00:26,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9324, LAS: 0.8769, UEM: 0.5601, LEM: 0.3258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4513, partial_loss/deprel_loss: 0.5420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6606, loss: 0.8319, batch_reg_loss: 0.1368, reg_loss: 0.1362 ||:  67%|######6   | 74/111 [00:50<00:23,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9312, LAS: 0.8757, UEM: 0.5582, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3023, partial_loss/deprel_loss: 0.4266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5386, loss: 0.8426, batch_reg_loss: 0.1369, reg_loss: 0.1363 ||:  70%|#######   | 78/111 [00:53<00:22,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9305, LAS: 0.8749, UEM: 0.5510, LEM: 0.3210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3944, partial_loss/deprel_loss: 0.5743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6753, loss: 0.8499, batch_reg_loss: 0.1370, reg_loss: 0.1363 ||:  74%|#######3  | 82/111 [00:56<00:19,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9310, LAS: 0.8753, UEM: 0.5488, LEM: 0.3173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3884, partial_loss/deprel_loss: 0.5201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6308, loss: 0.8477, batch_reg_loss: 0.1370, reg_loss: 0.1363 ||:  77%|#######6  | 85/111 [00:58<00:17,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9303, LAS: 0.8745, UEM: 0.5408, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9831, partial_loss/deprel_loss: 0.8483, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0123, loss: 0.8528, batch_reg_loss: 0.1371, reg_loss: 0.1363 ||:  79%|#######9  | 88/111 [01:00<00:15,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9297, LAS: 0.8737, UEM: 0.5392, LEM: 0.3100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4849, partial_loss/deprel_loss: 0.6716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7715, loss: 0.8581, batch_reg_loss: 0.1372, reg_loss: 0.1364 ||:  83%|########2 | 92/111 [01:02<00:12,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8381, UAS: 0.9299, LAS: 0.8737, UEM: 0.5393, LEM: 0.3086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0448, partial_loss/deprel_loss: 0.8961, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0631, loss: 0.8567, batch_reg_loss: 0.1373, reg_loss: 0.1364 ||:  86%|########6 | 96/111 [01:05<00:09,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8109, UAS: 0.9285, LAS: 0.8721, UEM: 0.5326, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6162, partial_loss/deprel_loss: 1.2664, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4737, loss: 0.8717, batch_reg_loss: 0.1374, reg_loss: 0.1364 ||:  90%|######### | 100/111 [01:08<00:07,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9289, LAS: 0.8726, UEM: 0.5333, LEM: 0.3021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6726, partial_loss/deprel_loss: 0.6797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8157, loss: 0.8672, batch_reg_loss: 0.1374, reg_loss: 0.1365 ||:  93%|#########2| 103/111 [01:10<00:05,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8184, UAS: 0.9280, LAS: 0.8714, UEM: 0.5288, LEM: 0.2982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3722, partial_loss/deprel_loss: 1.1339, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3191, loss: 0.8774, batch_reg_loss: 0.1375, reg_loss: 0.1365 ||:  96%|#########6| 107/111 [01:13<00:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8885, UAS: 0.9276, LAS: 0.8710, UEM: 0.5262, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5914, partial_loss/deprel_loss: 0.5512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6968, loss: 0.8794, batch_reg_loss: 0.1376, reg_loss: 0.1365 ||: 100%|##########| 111/111 [01:15<00:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8885, UAS: 0.9276, LAS: 0.8710, UEM: 0.5262, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5914, partial_loss/deprel_loss: 0.5512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6968, loss: 0.8794, batch_reg_loss: 0.1376, reg_loss: 0.1365 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
+      "2023-04-06 23:42:20,382 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:42:20,382 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:42:20,382 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.551  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.591  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.137  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - UEM                      |     0.526  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - LAS                      |     0.871  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - loss                     |     0.879  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - LEM                      |     0.296  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - UAS                      |     0.928  |       N/A\n",
+      "2023-04-06 23:42:20,384 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:42:20,384 - INFO - combo.training.tensorboard_writer - EM                       |     0.889  |       N/A\n",
+      "2023-04-06 23:42:20,384 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:42:20,384 - INFO - combo.training.trainer - Epoch duration: 0:01:15.902319\n",
+      "2023-04-06 23:42:20,384 - INFO - combo.training.trainer - Estimated training time remaining: 7:52:57\n",
+      "2023-04-06 23:42:20,385 - INFO - allennlp.training.trainer - Epoch 40/399\n",
+      "2023-04-06 23:42:20,385 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:42:20,385 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:42:20,392 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8570, UAS: 0.9317, LAS: 0.8756, UEM: 0.5489, LEM: 0.2962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8281, partial_loss/deprel_loss: 0.8210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9601, loss: 0.8450, batch_reg_loss: 0.1376, reg_loss: 0.1376 ||:   4%|3         | 4/111 [00:02<01:11,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9439, LAS: 0.8883, UEM: 0.6418, LEM: 0.3665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3450, partial_loss/deprel_loss: 0.6142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6981, loss: 0.7376, batch_reg_loss: 0.1377, reg_loss: 0.1376 ||:   6%|6         | 7/111 [00:05<01:17,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.9406, LAS: 0.8849, UEM: 0.5977, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9597, partial_loss/deprel_loss: 0.8677, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0238, loss: 0.7623, batch_reg_loss: 0.1378, reg_loss: 0.1377 ||:   9%|9         | 10/111 [00:07<01:15,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9310, LAS: 0.8748, UEM: 0.5612, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5104, partial_loss/deprel_loss: 0.6686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7747, loss: 0.8476, batch_reg_loss: 0.1378, reg_loss: 0.1377 ||:  12%|#1        | 13/111 [00:09<01:12,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9346, LAS: 0.8790, UEM: 0.5600, LEM: 0.2946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3911, partial_loss/deprel_loss: 0.5027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6182, loss: 0.8156, batch_reg_loss: 0.1379, reg_loss: 0.1377 ||:  14%|#4        | 16/111 [00:12<01:10,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9323, LAS: 0.8758, UEM: 0.5203, LEM: 0.2651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9130, partial_loss/deprel_loss: 0.9827, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1067, loss: 0.8472, batch_reg_loss: 0.1379, reg_loss: 0.1378 ||:  18%|#8        | 20/111 [00:14<01:05,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9317, LAS: 0.8753, UEM: 0.4986, LEM: 0.2493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7004, partial_loss/deprel_loss: 0.7843, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9055, loss: 0.8557, batch_reg_loss: 0.1380, reg_loss: 0.1378 ||:  21%|##        | 23/111 [00:16<01:03,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9292, LAS: 0.8729, UEM: 0.4781, LEM: 0.2357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4067, partial_loss/deprel_loss: 0.5801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6835, loss: 0.8777, batch_reg_loss: 0.1381, reg_loss: 0.1378 ||:  24%|##4       | 27/111 [00:19<00:57,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8920, UAS: 0.9319, LAS: 0.8755, UEM: 0.5036, LEM: 0.2529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5178, partial_loss/deprel_loss: 0.6325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7477, loss: 0.8563, batch_reg_loss: 0.1381, reg_loss: 0.1379 ||:  28%|##7       | 31/111 [00:21<00:53,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9352, LAS: 0.8802, UEM: 0.5864, LEM: 0.3575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4408, partial_loss/deprel_loss: 0.6740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7656, loss: 0.8228, batch_reg_loss: 0.1382, reg_loss: 0.1379 ||:  31%|###       | 34/111 [00:24<00:56,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9331, LAS: 0.8780, UEM: 0.5720, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5699, partial_loss/deprel_loss: 0.6384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7629, loss: 0.8427, batch_reg_loss: 0.1382, reg_loss: 0.1379 ||:  33%|###3      | 37/111 [00:26<00:53,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9335, LAS: 0.8782, UEM: 0.5702, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2598, partial_loss/deprel_loss: 0.4579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5566, loss: 0.8412, batch_reg_loss: 0.1383, reg_loss: 0.1380 ||:  37%|###6      | 41/111 [00:29<00:48,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9335, LAS: 0.8780, UEM: 0.5642, LEM: 0.3338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8098, partial_loss/deprel_loss: 0.8707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9969, loss: 0.8421, batch_reg_loss: 0.1384, reg_loss: 0.1380 ||:  40%|###9      | 44/111 [00:31<00:48,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9330, LAS: 0.8774, UEM: 0.5605, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3433, partial_loss/deprel_loss: 0.4961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6040, loss: 0.8485, batch_reg_loss: 0.1384, reg_loss: 0.1380 ||:  42%|####2     | 47/111 [00:33<00:46,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9339, LAS: 0.8782, UEM: 0.5593, LEM: 0.3252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3518, partial_loss/deprel_loss: 0.4778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5911, loss: 0.8408, batch_reg_loss: 0.1385, reg_loss: 0.1380 ||:  45%|####5     | 50/111 [00:35<00:43,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8571, UAS: 0.9330, LAS: 0.8769, UEM: 0.5442, LEM: 0.3141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8073, partial_loss/deprel_loss: 0.8530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9824, loss: 0.8503, batch_reg_loss: 0.1385, reg_loss: 0.1381 ||:  49%|####8     | 54/111 [00:38<00:39,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9338, LAS: 0.8778, UEM: 0.5522, LEM: 0.3229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5658, partial_loss/deprel_loss: 0.7195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8274, loss: 0.8418, batch_reg_loss: 0.1386, reg_loss: 0.1381 ||:  51%|#####1    | 57/111 [00:40<00:39,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9322, LAS: 0.8759, UEM: 0.5406, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8303, partial_loss/deprel_loss: 0.8697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0005, loss: 0.8547, batch_reg_loss: 0.1387, reg_loss: 0.1381 ||:  55%|#####4    | 61/111 [00:43<00:34,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8370, UAS: 0.9314, LAS: 0.8750, UEM: 0.5303, LEM: 0.3042, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0092, partial_loss/deprel_loss: 0.9400, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0926, loss: 0.8601, batch_reg_loss: 0.1387, reg_loss: 0.1382 ||:  59%|#####8    | 65/111 [00:45<00:29,  1.54it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9322, LAS: 0.8760, UEM: 0.5436, LEM: 0.3141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2285, partial_loss/deprel_loss: 0.4120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.8483, batch_reg_loss: 0.1388, reg_loss: 0.1382 ||:  62%|######2   | 69/111 [00:48<00:27,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9315, LAS: 0.8752, UEM: 0.5358, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7962, partial_loss/deprel_loss: 0.7627, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9083, loss: 0.8559, batch_reg_loss: 0.1389, reg_loss: 0.1382 ||:  66%|######5   | 73/111 [00:50<00:25,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8556, UAS: 0.9308, LAS: 0.8746, UEM: 0.5263, LEM: 0.3017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9985, partial_loss/deprel_loss: 0.9882, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1292, loss: 0.8618, batch_reg_loss: 0.1390, reg_loss: 0.1383 ||:  69%|######9   | 77/111 [00:53<00:23,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9306, LAS: 0.8743, UEM: 0.5325, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2627, partial_loss/deprel_loss: 0.4424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.8641, batch_reg_loss: 0.1390, reg_loss: 0.1383 ||:  73%|#######2  | 81/111 [00:56<00:21,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9309, LAS: 0.8746, UEM: 0.5345, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3698, partial_loss/deprel_loss: 0.4835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5998, loss: 0.8614, batch_reg_loss: 0.1391, reg_loss: 0.1383 ||:  77%|#######6  | 85/111 [00:59<00:17,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9311, LAS: 0.8748, UEM: 0.5386, LEM: 0.3098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1995, partial_loss/deprel_loss: 0.3761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4799, loss: 0.8597, batch_reg_loss: 0.1392, reg_loss: 0.1384 ||:  79%|#######9  | 88/111 [01:01<00:15,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7752, UAS: 0.9306, LAS: 0.8743, UEM: 0.5397, LEM: 0.3097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1589, partial_loss/deprel_loss: 1.3621, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6607, loss: 0.8631, batch_reg_loss: 0.1392, reg_loss: 0.1384 ||:  83%|########2 | 92/111 [01:03<00:12,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9301, LAS: 0.8737, UEM: 0.5393, LEM: 0.3071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4196, partial_loss/deprel_loss: 0.6012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7042, loss: 0.8662, batch_reg_loss: 0.1393, reg_loss: 0.1384 ||:  86%|########5 | 95/111 [01:06<00:11,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9305, LAS: 0.8740, UEM: 0.5404, LEM: 0.3065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3724, partial_loss/deprel_loss: 0.5439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6489, loss: 0.8636, batch_reg_loss: 0.1393, reg_loss: 0.1385 ||:  88%|########8 | 98/111 [01:08<00:09,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8126, UAS: 0.9289, LAS: 0.8722, UEM: 0.5321, LEM: 0.3010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5588, partial_loss/deprel_loss: 1.1620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3808, loss: 0.8792, batch_reg_loss: 0.1394, reg_loss: 0.1385 ||:  92%|#########1| 102/111 [01:10<00:06,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9288, LAS: 0.8719, UEM: 0.5261, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6212, partial_loss/deprel_loss: 0.7073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8296, loss: 0.8832, batch_reg_loss: 0.1395, reg_loss: 0.1385 ||:  95%|#########5| 106/111 [01:13<00:03,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8191, UAS: 0.9283, LAS: 0.8714, UEM: 0.5235, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4445, partial_loss/deprel_loss: 1.0017, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2298, loss: 0.8870, batch_reg_loss: 0.1396, reg_loss: 0.1386 ||:  99%|#########9| 110/111 [01:16<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9286, LAS: 0.8717, UEM: 0.5255, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2913, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5934, loss: 0.8844, batch_reg_loss: 0.1396, reg_loss: 0.1386 ||: 100%|##########| 111/111 [01:17<00:00,  1.44it/s]\n",
+      "2023-04-06 23:43:37,470 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9208, LAS: 0.8625, UEM: 0.4979, LEM: 0.1992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3803, partial_loss/deprel_loss: 25.0669, partial_loss/cycle_loss: 0.0000, batch_loss: 20.1296, loss: 34.6105, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.03s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9200, LAS: 0.8624, UEM: 0.3798, LEM: 0.1298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2659, partial_loss/deprel_loss: 50.9556, partial_loss/cycle_loss: 0.0000, batch_loss: 41.0176, loss: 35.2960, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  31%|###       | 4/13 [00:04<00:09,  1.03s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9319, LAS: 0.8754, UEM: 0.4854, LEM: 0.2095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5658, partial_loss/deprel_loss: 25.1574, partial_loss/cycle_loss: 0.0000, batch_loss: 20.2391, loss: 30.3282, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:06<00:05,  1.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9064, UAS: 0.9407, LAS: 0.8855, UEM: 0.6077, LEM: 0.3154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3743, partial_loss/deprel_loss: 26.9548, partial_loss/cycle_loss: 0.0000, batch_loss: 21.6387, loss: 28.1431, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:04,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9435, LAS: 0.8899, UEM: 0.6518, LEM: 0.3867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7037, partial_loss/deprel_loss: 31.0434, partial_loss/cycle_loss: 0.0000, batch_loss: 24.9755, loss: 26.9689, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9423, LAS: 0.8885, UEM: 0.6328, LEM: 0.3709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9222, partial_loss/deprel_loss: 32.1733, partial_loss/cycle_loss: 0.0000, batch_loss: 25.9231, loss: 26.8884, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.05it/s]\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.494  |    32.173\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.291  |     0.922\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.139  |     0.000\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - UEM                      |     0.525  |     0.633\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - LAS                      |     0.872  |     0.888\n",
+      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - loss                     |     0.884  |    26.888\n",
+      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - LEM                      |     0.294  |     0.371\n",
+      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |     0.942\n",
+      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - EM                       |     0.911  |     0.871\n",
+      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:43:49,822 - INFO - combo.training.trainer - Epoch duration: 0:01:29.437908\n",
+      "2023-04-06 23:43:49,823 - INFO - combo.training.trainer - Estimated training time remaining: 7:53:11\n",
+      "2023-04-06 23:43:49,823 - INFO - allennlp.training.trainer - Epoch 41/399\n",
+      "2023-04-06 23:43:49,823 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:43:49,823 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:43:49,829 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9473, LAS: 0.8922, UEM: 0.5747, LEM: 0.2760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7457, partial_loss/deprel_loss: 0.8736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9877, loss: 0.7340, batch_reg_loss: 0.1397, reg_loss: 0.1396 ||:   4%|3         | 4/111 [00:02<01:06,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8831, UAS: 0.9386, LAS: 0.8829, UEM: 0.5009, LEM: 0.2195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.6803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7971, loss: 0.8012, batch_reg_loss: 0.1397, reg_loss: 0.1397 ||:   6%|6         | 7/111 [00:04<01:06,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9384, LAS: 0.8814, UEM: 0.4792, LEM: 0.2018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3911, partial_loss/deprel_loss: 0.5334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6447, loss: 0.8055, batch_reg_loss: 0.1398, reg_loss: 0.1397 ||:  10%|9         | 11/111 [00:07<01:05,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9380, LAS: 0.8812, UEM: 0.4718, LEM: 0.1999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6246, partial_loss/deprel_loss: 0.7587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8718, loss: 0.8062, batch_reg_loss: 0.1399, reg_loss: 0.1397 ||:  14%|#3        | 15/111 [00:09<01:01,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9369, LAS: 0.8806, UEM: 0.4850, LEM: 0.2139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4880, partial_loss/deprel_loss: 0.5864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7066, loss: 0.8159, batch_reg_loss: 0.1399, reg_loss: 0.1398 ||:  16%|#6        | 18/111 [00:12<01:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9404, LAS: 0.8844, UEM: 0.5462, LEM: 0.2671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2989, partial_loss/deprel_loss: 0.4637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5707, loss: 0.7806, batch_reg_loss: 0.1400, reg_loss: 0.1398 ||:  19%|#8        | 21/111 [00:14<01:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9405, LAS: 0.8848, UEM: 0.5380, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7704, partial_loss/deprel_loss: 0.7739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9132, loss: 0.7765, batch_reg_loss: 0.1400, reg_loss: 0.1398 ||:  22%|##1       | 24/111 [00:16<01:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9381, LAS: 0.8821, UEM: 0.5425, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4807, partial_loss/deprel_loss: 0.6797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.7943, batch_reg_loss: 0.1401, reg_loss: 0.1398 ||:  24%|##4       | 27/111 [00:18<01:00,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8412, UAS: 0.9360, LAS: 0.8798, UEM: 0.5291, LEM: 0.2597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2766, partial_loss/deprel_loss: 0.8635, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0862, loss: 0.8113, batch_reg_loss: 0.1401, reg_loss: 0.1399 ||:  27%|##7       | 30/111 [00:20<00:56,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8469, UAS: 0.9353, LAS: 0.8792, UEM: 0.5505, LEM: 0.2951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0839, partial_loss/deprel_loss: 0.9513, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1179, loss: 0.8167, batch_reg_loss: 0.1401, reg_loss: 0.1399 ||:  30%|##9       | 33/111 [00:22<00:55,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9379, LAS: 0.8819, UEM: 0.5853, LEM: 0.3245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1621, partial_loss/deprel_loss: 0.4345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.7952, batch_reg_loss: 0.1402, reg_loss: 0.1399 ||:  32%|###2      | 36/111 [00:25<00:54,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9373, LAS: 0.8810, UEM: 0.5804, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5903, partial_loss/deprel_loss: 0.6910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8111, loss: 0.8015, batch_reg_loss: 0.1403, reg_loss: 0.1399 ||:  36%|###6      | 40/111 [00:27<00:50,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9365, LAS: 0.8805, UEM: 0.5882, LEM: 0.3335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1602, partial_loss/deprel_loss: 0.3119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4219, loss: 0.8045, batch_reg_loss: 0.1403, reg_loss: 0.1400 ||:  39%|###8      | 43/111 [00:29<00:48,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8546, UAS: 0.9357, LAS: 0.8799, UEM: 0.5839, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0559, partial_loss/deprel_loss: 0.8560, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0364, loss: 0.8087, batch_reg_loss: 0.1404, reg_loss: 0.1400 ||:  41%|####1     | 46/111 [00:32<00:45,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9341, LAS: 0.8782, UEM: 0.5697, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4055, partial_loss/deprel_loss: 0.4768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6030, loss: 0.8229, batch_reg_loss: 0.1404, reg_loss: 0.1400 ||:  45%|####5     | 50/111 [00:34<00:41,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8459, UAS: 0.9332, LAS: 0.8772, UEM: 0.5581, LEM: 0.3137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9401, partial_loss/deprel_loss: 0.8900, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0405, loss: 0.8303, batch_reg_loss: 0.1405, reg_loss: 0.1401 ||:  48%|####7     | 53/111 [00:36<00:39,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9313, LAS: 0.8754, UEM: 0.5553, LEM: 0.3113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7602, partial_loss/deprel_loss: 0.7644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9042, loss: 0.8451, batch_reg_loss: 0.1406, reg_loss: 0.1401 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9299, LAS: 0.8736, UEM: 0.5401, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6608, partial_loss/deprel_loss: 0.7292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8562, loss: 0.8595, batch_reg_loss: 0.1406, reg_loss: 0.1401 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8242, UAS: 0.9297, LAS: 0.8732, UEM: 0.5341, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2914, partial_loss/deprel_loss: 0.9993, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1984, loss: 0.8635, batch_reg_loss: 0.1407, reg_loss: 0.1401 ||:  57%|#####6    | 63/111 [00:43<00:33,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9302, LAS: 0.8736, UEM: 0.5320, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3977, partial_loss/deprel_loss: 0.5494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6598, loss: 0.8592, batch_reg_loss: 0.1408, reg_loss: 0.1402 ||:  59%|#####9    | 66/111 [00:45<00:31,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8815, UAS: 0.9306, LAS: 0.8740, UEM: 0.5362, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5458, partial_loss/deprel_loss: 0.6075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7360, loss: 0.8557, batch_reg_loss: 0.1408, reg_loss: 0.1402 ||:  63%|######3   | 70/111 [00:48<00:28,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9305, LAS: 0.8737, UEM: 0.5287, LEM: 0.2884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3618, partial_loss/deprel_loss: 0.5886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6841, loss: 0.8577, batch_reg_loss: 0.1409, reg_loss: 0.1402 ||:  67%|######6   | 74/111 [00:50<00:24,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8691, UAS: 0.9301, LAS: 0.8732, UEM: 0.5233, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6254, partial_loss/deprel_loss: 0.8169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9195, loss: 0.8652, batch_reg_loss: 0.1410, reg_loss: 0.1403 ||:  70%|#######   | 78/111 [00:53<00:21,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8655, UAS: 0.9296, LAS: 0.8724, UEM: 0.5124, LEM: 0.2764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8604, partial_loss/deprel_loss: 0.7997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9529, loss: 0.8711, batch_reg_loss: 0.1411, reg_loss: 0.1403 ||:  74%|#######3  | 82/111 [00:56<00:19,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8117, UAS: 0.9287, LAS: 0.8713, UEM: 0.5086, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6232, partial_loss/deprel_loss: 1.1753, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4060, loss: 0.8803, batch_reg_loss: 0.1411, reg_loss: 0.1404 ||:  77%|#######7  | 86/111 [00:58<00:16,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8470, UAS: 0.9289, LAS: 0.8716, UEM: 0.5090, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9237, partial_loss/deprel_loss: 0.8957, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0425, loss: 0.8771, batch_reg_loss: 0.1412, reg_loss: 0.1404 ||:  81%|########1 | 90/111 [01:01<00:14,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8360, UAS: 0.9291, LAS: 0.8718, UEM: 0.5114, LEM: 0.2740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2032, partial_loss/deprel_loss: 1.0468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2193, loss: 0.8760, batch_reg_loss: 0.1413, reg_loss: 0.1404 ||:  84%|########3 | 93/111 [01:05<00:15,  1.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9303, LAS: 0.8733, UEM: 0.5341, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0761, partial_loss/deprel_loss: 0.1753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2968, loss: 0.8647, batch_reg_loss: 0.1413, reg_loss: 0.1404 ||:  86%|########6 | 96/111 [01:08<00:12,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9304, LAS: 0.8733, UEM: 0.5303, LEM: 0.2949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4572, partial_loss/deprel_loss: 0.5740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6921, loss: 0.8644, batch_reg_loss: 0.1414, reg_loss: 0.1405 ||:  90%|######### | 100/111 [01:10<00:08,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7828, UAS: 0.9302, LAS: 0.8732, UEM: 0.5366, LEM: 0.3012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0178, partial_loss/deprel_loss: 1.2750, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5650, loss: 0.8644, batch_reg_loss: 0.1415, reg_loss: 0.1405 ||:  93%|#########2| 103/111 [01:12<00:06,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8301, UAS: 0.9297, LAS: 0.8725, UEM: 0.5303, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2271, partial_loss/deprel_loss: 0.9879, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1772, loss: 0.8693, batch_reg_loss: 0.1415, reg_loss: 0.1405 ||:  96%|#########6| 107/111 [01:15<00:02,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9286, LAS: 0.8714, UEM: 0.5247, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5258, partial_loss/deprel_loss: 1.1332, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3533, loss: 0.8775, batch_reg_loss: 0.1416, reg_loss: 0.1406 ||: 100%|##########| 111/111 [01:17<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9286, LAS: 0.8714, UEM: 0.5247, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5258, partial_loss/deprel_loss: 1.1332, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3533, loss: 0.8775, batch_reg_loss: 0.1416, reg_loss: 0.1406 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
+      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.133  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.526  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.141  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - UEM                      |     0.525  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - LAS                      |     0.871  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - loss                     |     0.877  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - LEM                      |     0.292  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - EM                       |     0.808  |       N/A\n",
+      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:45:07,634 - INFO - combo.training.trainer - Epoch duration: 0:01:17.811230\n",
+      "2023-04-06 23:45:07,634 - INFO - combo.training.trainer - Estimated training time remaining: 7:51:41\n",
+      "2023-04-06 23:45:07,634 - INFO - allennlp.training.trainer - Epoch 42/399\n",
+      "2023-04-06 23:45:07,634 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:45:07,635 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:45:07,641 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9418, LAS: 0.8844, UEM: 0.6837, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1491, partial_loss/deprel_loss: 0.3171, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4252, loss: 0.7424, batch_reg_loss: 0.1416, reg_loss: 0.1416 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9439, LAS: 0.8897, UEM: 0.6355, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3734, partial_loss/deprel_loss: 0.5091, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6237, loss: 0.7500, batch_reg_loss: 0.1417, reg_loss: 0.1416 ||:   6%|6         | 7/111 [00:04<01:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8109, UAS: 0.9345, LAS: 0.8808, UEM: 0.5993, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8176, partial_loss/deprel_loss: 1.0696, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3609, loss: 0.8223, batch_reg_loss: 0.1418, reg_loss: 0.1417 ||:   9%|9         | 10/111 [00:06<01:10,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9321, LAS: 0.8780, UEM: 0.5473, LEM: 0.3023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9754, partial_loss/deprel_loss: 0.9375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0869, loss: 0.8430, batch_reg_loss: 0.1418, reg_loss: 0.1417 ||:  12%|#1        | 13/111 [00:09<01:11,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9290, LAS: 0.8745, UEM: 0.5006, LEM: 0.2696, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9098, partial_loss/deprel_loss: 0.8706, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0203, loss: 0.8699, batch_reg_loss: 0.1419, reg_loss: 0.1417 ||:  14%|#4        | 16/111 [00:11<01:08,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7885, UAS: 0.9225, LAS: 0.8667, UEM: 0.4693, LEM: 0.2489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9202, partial_loss/deprel_loss: 1.2812, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5509, loss: 0.9321, batch_reg_loss: 0.1419, reg_loss: 0.1418 ||:  17%|#7        | 19/111 [00:13<01:06,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9252, LAS: 0.8689, UEM: 0.4885, LEM: 0.2640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2645, partial_loss/deprel_loss: 0.3956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5114, loss: 0.9091, batch_reg_loss: 0.1420, reg_loss: 0.1418 ||:  20%|#9        | 22/111 [00:15<01:04,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7888, UAS: 0.9224, LAS: 0.8653, UEM: 0.4605, LEM: 0.2419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7105, partial_loss/deprel_loss: 1.1578, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4104, loss: 0.9309, batch_reg_loss: 0.1421, reg_loss: 0.1418 ||:  23%|##3       | 26/111 [00:18<00:57,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9242, LAS: 0.8673, UEM: 0.4631, LEM: 0.2382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6195, partial_loss/deprel_loss: 0.7172, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8398, loss: 0.9185, batch_reg_loss: 0.1421, reg_loss: 0.1419 ||:  27%|##7       | 30/111 [00:20<00:54,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9257, LAS: 0.8693, UEM: 0.4708, LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4584, partial_loss/deprel_loss: 0.5306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6584, loss: 0.9047, batch_reg_loss: 0.1422, reg_loss: 0.1419 ||:  31%|###       | 34/111 [00:22<00:49,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9266, LAS: 0.8708, UEM: 0.5190, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5656, partial_loss/deprel_loss: 1.1580, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3818, loss: 0.8919, batch_reg_loss: 0.1423, reg_loss: 0.1419 ||:  34%|###4      | 38/111 [00:25<00:47,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8013, UAS: 0.9268, LAS: 0.8702, UEM: 0.5255, LEM: 0.2939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6049, partial_loss/deprel_loss: 1.2007, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4239, loss: 0.8945, batch_reg_loss: 0.1424, reg_loss: 0.1420 ||:  38%|###7      | 42/111 [00:28<00:44,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9244, LAS: 0.8681, UEM: 0.5113, LEM: 0.2843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5069, partial_loss/deprel_loss: 0.5866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7131, loss: 0.9143, batch_reg_loss: 0.1425, reg_loss: 0.1420 ||:  41%|####1     | 46/111 [00:30<00:42,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9260, LAS: 0.8699, UEM: 0.5146, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9033, partial_loss/deprel_loss: 0.9612, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0922, loss: 0.9012, batch_reg_loss: 0.1425, reg_loss: 0.1421 ||:  45%|####5     | 50/111 [00:33<00:41,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9262, LAS: 0.8700, UEM: 0.5082, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3898, partial_loss/deprel_loss: 0.5459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6573, loss: 0.8964, batch_reg_loss: 0.1426, reg_loss: 0.1421 ||:  48%|####7     | 53/111 [00:35<00:39,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9264, LAS: 0.8700, UEM: 0.5088, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2628, partial_loss/deprel_loss: 0.4712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5722, loss: 0.8967, batch_reg_loss: 0.1427, reg_loss: 0.1421 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8572, UAS: 0.9269, LAS: 0.8703, UEM: 0.5012, LEM: 0.2697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8432, partial_loss/deprel_loss: 0.8230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9697, loss: 0.8934, batch_reg_loss: 0.1427, reg_loss: 0.1422 ||:  54%|#####4    | 60/111 [00:40<00:33,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9261, LAS: 0.8694, UEM: 0.4960, LEM: 0.2659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4341, partial_loss/deprel_loss: 0.5681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6841, loss: 0.9014, batch_reg_loss: 0.1428, reg_loss: 0.1422 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9270, LAS: 0.8702, UEM: 0.5018, LEM: 0.2708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4418, partial_loss/deprel_loss: 0.5853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6995, loss: 0.8965, batch_reg_loss: 0.1429, reg_loss: 0.1422 ||:  61%|######1   | 68/111 [00:45<00:29,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9281, LAS: 0.8715, UEM: 0.5132, LEM: 0.2776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3822, partial_loss/deprel_loss: 0.5883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6900, loss: 0.8848, batch_reg_loss: 0.1429, reg_loss: 0.1423 ||:  64%|######3   | 71/111 [00:47<00:27,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9280, LAS: 0.8712, UEM: 0.5081, LEM: 0.2720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6994, partial_loss/deprel_loss: 0.7017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8442, loss: 0.8869, batch_reg_loss: 0.1430, reg_loss: 0.1423 ||:  68%|######7   | 75/111 [00:50<00:23,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.9281, LAS: 0.8714, UEM: 0.5251, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4009, partial_loss/deprel_loss: 1.1302, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3274, loss: 0.8879, batch_reg_loss: 0.1431, reg_loss: 0.1423 ||:  71%|#######1  | 79/111 [00:53<00:21,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8092, UAS: 0.9276, LAS: 0.8707, UEM: 0.5240, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5534, partial_loss/deprel_loss: 1.0782, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3164, loss: 0.8904, batch_reg_loss: 0.1432, reg_loss: 0.1424 ||:  75%|#######4  | 83/111 [00:55<00:18,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9264, LAS: 0.8695, UEM: 0.5132, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8338, partial_loss/deprel_loss: 0.8070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9556, loss: 0.9018, batch_reg_loss: 0.1432, reg_loss: 0.1424 ||:  78%|#######8  | 87/111 [00:58<00:15,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9264, LAS: 0.8696, UEM: 0.5124, LEM: 0.2889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.4932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5954, loss: 0.9021, batch_reg_loss: 0.1433, reg_loss: 0.1425 ||:  82%|########1 | 91/111 [01:00<00:12,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9273, LAS: 0.8706, UEM: 0.5229, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3174, partial_loss/deprel_loss: 0.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5409, loss: 0.8934, batch_reg_loss: 0.1434, reg_loss: 0.1425 ||:  86%|########5 | 95/111 [01:04<00:11,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9280, LAS: 0.8714, UEM: 0.5268, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5531, partial_loss/deprel_loss: 0.6957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8106, loss: 0.8872, batch_reg_loss: 0.1434, reg_loss: 0.1425 ||:  88%|########8 | 98/111 [01:06<00:09,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8226, UAS: 0.9276, LAS: 0.8709, UEM: 0.5227, LEM: 0.2933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2476, partial_loss/deprel_loss: 1.0486, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2319, loss: 0.8905, batch_reg_loss: 0.1435, reg_loss: 0.1425 ||:  91%|######### | 101/111 [01:08<00:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8271, UAS: 0.9276, LAS: 0.8708, UEM: 0.5191, LEM: 0.2894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2091, partial_loss/deprel_loss: 0.9989, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1845, loss: 0.8903, batch_reg_loss: 0.1435, reg_loss: 0.1426 ||:  94%|#########3| 104/111 [01:10<00:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9281, LAS: 0.8713, UEM: 0.5172, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3627, partial_loss/deprel_loss: 0.5546, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.8854, batch_reg_loss: 0.1436, reg_loss: 0.1426 ||:  97%|#########7| 108/111 [01:12<00:02,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9289, LAS: 0.8721, UEM: 0.5273, LEM: 0.2946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1537, partial_loss/deprel_loss: 0.3458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4510, loss: 0.8789, batch_reg_loss: 0.1437, reg_loss: 0.1426 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-06 23:46:23,087 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.346  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.154  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.143  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - UEM                      |     0.527  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - LAS                      |     0.872  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - loss                     |     0.879  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - LEM                      |     0.295  |       N/A\n",
+      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
+      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - EM                       |     0.923  |       N/A\n",
+      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:46:23,089 - INFO - combo.training.trainer - Epoch duration: 0:01:15.455331\n",
+      "2023-04-06 23:46:23,090 - INFO - combo.training.trainer - Estimated training time remaining: 7:49:52\n",
+      "2023-04-06 23:46:23,090 - INFO - allennlp.training.trainer - Epoch 43/399\n",
+      "2023-04-06 23:46:23,090 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:46:23,090 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:46:23,096 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9428, LAS: 0.8899, UEM: 0.5301, LEM: 0.2811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7088, partial_loss/deprel_loss: 0.7559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8902, loss: 0.7165, batch_reg_loss: 0.1437, reg_loss: 0.1437 ||:   4%|3         | 4/111 [00:02<01:12,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9305, LAS: 0.8755, UEM: 0.4153, LEM: 0.2112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9663, partial_loss/deprel_loss: 0.8616, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0263, loss: 0.8579, batch_reg_loss: 0.1438, reg_loss: 0.1437 ||:   6%|6         | 7/111 [00:04<01:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9267, LAS: 0.8695, UEM: 0.3652, LEM: 0.1685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4697, partial_loss/deprel_loss: 0.6609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7665, loss: 0.8932, batch_reg_loss: 0.1438, reg_loss: 0.1438 ||:  10%|9         | 11/111 [00:07<01:07,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9308, LAS: 0.8744, UEM: 0.4503, LEM: 0.2264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2776, partial_loss/deprel_loss: 0.3887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5104, loss: 0.8467, batch_reg_loss: 0.1439, reg_loss: 0.1438 ||:  13%|#2        | 14/111 [00:09<01:07,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9310, LAS: 0.8749, UEM: 0.4808, LEM: 0.2451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4315, partial_loss/deprel_loss: 0.5662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6832, loss: 0.8372, batch_reg_loss: 0.1439, reg_loss: 0.1438 ||:  15%|#5        | 17/111 [00:11<01:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9305, LAS: 0.8744, UEM: 0.4984, LEM: 0.2527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2001, partial_loss/deprel_loss: 0.4246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5237, loss: 0.8381, batch_reg_loss: 0.1440, reg_loss: 0.1438 ||:  18%|#8        | 20/111 [00:14<01:04,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9311, LAS: 0.8754, UEM: 0.4955, LEM: 0.2494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4113, partial_loss/deprel_loss: 0.5384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6570, loss: 0.8374, batch_reg_loss: 0.1440, reg_loss: 0.1438 ||:  21%|##        | 23/111 [00:16<01:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9299, LAS: 0.8747, UEM: 0.5014, LEM: 0.2621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0566, partial_loss/deprel_loss: 0.9292, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0988, loss: 0.8457, batch_reg_loss: 0.1441, reg_loss: 0.1439 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9280, LAS: 0.8729, UEM: 0.4755, LEM: 0.2457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7893, partial_loss/deprel_loss: 0.7554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9063, loss: 0.8606, batch_reg_loss: 0.1441, reg_loss: 0.1439 ||:  27%|##7       | 30/111 [00:20<00:53,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9309, LAS: 0.8757, UEM: 0.4968, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.7238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8175, loss: 0.8412, batch_reg_loss: 0.1442, reg_loss: 0.1439 ||:  31%|###       | 34/111 [00:23<00:50,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9296, LAS: 0.8741, UEM: 0.4825, LEM: 0.2462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4805, partial_loss/deprel_loss: 0.6438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7554, loss: 0.8578, batch_reg_loss: 0.1443, reg_loss: 0.1440 ||:  33%|###3      | 37/111 [00:25<00:49,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9576, UAS: 0.9296, LAS: 0.8747, UEM: 0.5280, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0719, partial_loss/deprel_loss: 0.1706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2952, loss: 0.8560, batch_reg_loss: 0.1443, reg_loss: 0.1440 ||:  36%|###6      | 40/111 [00:27<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8147, UAS: 0.9272, LAS: 0.8719, UEM: 0.5142, LEM: 0.2989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4103, partial_loss/deprel_loss: 1.0491, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2657, loss: 0.8769, batch_reg_loss: 0.1444, reg_loss: 0.1440 ||:  39%|###8      | 43/111 [00:29<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8604, UAS: 0.9253, LAS: 0.8700, UEM: 0.5011, LEM: 0.2891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8102, partial_loss/deprel_loss: 0.8194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9620, loss: 0.8908, batch_reg_loss: 0.1444, reg_loss: 0.1440 ||:  41%|####1     | 46/111 [00:31<00:46,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9264, LAS: 0.8710, UEM: 0.5009, LEM: 0.2851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3478, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6148, loss: 0.8833, batch_reg_loss: 0.1445, reg_loss: 0.1441 ||:  44%|####4     | 49/111 [00:33<00:43,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9273, LAS: 0.8721, UEM: 0.5077, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4123, partial_loss/deprel_loss: 0.5633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6777, loss: 0.8738, batch_reg_loss: 0.1446, reg_loss: 0.1441 ||:  48%|####7     | 53/111 [00:36<00:39,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9277, LAS: 0.8724, UEM: 0.5111, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2746, partial_loss/deprel_loss: 0.5166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6128, loss: 0.8723, batch_reg_loss: 0.1446, reg_loss: 0.1441 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9271, LAS: 0.8720, UEM: 0.5031, LEM: 0.2829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3995, partial_loss/deprel_loss: 0.4965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6218, loss: 0.8758, batch_reg_loss: 0.1447, reg_loss: 0.1442 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9282, LAS: 0.8732, UEM: 0.5039, LEM: 0.2799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4876, partial_loss/deprel_loss: 0.6137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7333, loss: 0.8675, batch_reg_loss: 0.1448, reg_loss: 0.1442 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9280, LAS: 0.8729, UEM: 0.5005, LEM: 0.2765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7839, partial_loss/deprel_loss: 0.7660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9144, loss: 0.8710, batch_reg_loss: 0.1449, reg_loss: 0.1442 ||:  61%|######1   | 68/111 [00:46<00:27,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9287, LAS: 0.8736, UEM: 0.4970, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4859, partial_loss/deprel_loss: 0.6183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7367, loss: 0.8662, batch_reg_loss: 0.1449, reg_loss: 0.1443 ||:  65%|######4   | 72/111 [00:48<00:23,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8157, UAS: 0.9272, LAS: 0.8720, UEM: 0.4943, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5636, partial_loss/deprel_loss: 1.0879, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3280, loss: 0.8815, batch_reg_loss: 0.1450, reg_loss: 0.1443 ||:  68%|######8   | 76/111 [00:50<00:21,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8144, UAS: 0.9269, LAS: 0.8717, UEM: 0.5034, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5043, partial_loss/deprel_loss: 1.1348, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3537, loss: 0.8843, batch_reg_loss: 0.1450, reg_loss: 0.1443 ||:  72%|#######2  | 80/111 [00:53<00:18,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9266, LAS: 0.8709, UEM: 0.4931, LEM: 0.2729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7594, partial_loss/deprel_loss: 0.8771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9986, loss: 0.8908, batch_reg_loss: 0.1451, reg_loss: 0.1444 ||:  76%|#######5  | 84/111 [00:55<00:16,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9272, LAS: 0.8716, UEM: 0.5056, LEM: 0.2823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3730, partial_loss/deprel_loss: 0.5287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6428, loss: 0.8835, batch_reg_loss: 0.1452, reg_loss: 0.1444 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9283, LAS: 0.8730, UEM: 0.5235, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1638, partial_loss/deprel_loss: 0.2994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4175, loss: 0.8710, batch_reg_loss: 0.1453, reg_loss: 0.1445 ||:  83%|########2 | 92/111 [01:01<00:13,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9284, LAS: 0.8731, UEM: 0.5205, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4851, partial_loss/deprel_loss: 0.6839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7895, loss: 0.8712, batch_reg_loss: 0.1453, reg_loss: 0.1445 ||:  86%|########6 | 96/111 [01:04<00:09,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9279, LAS: 0.8724, UEM: 0.5209, LEM: 0.2968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1321, partial_loss/deprel_loss: 1.0463, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2089, loss: 0.8762, batch_reg_loss: 0.1454, reg_loss: 0.1445 ||:  90%|######### | 100/111 [01:06<00:07,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8728, UAS: 0.9277, LAS: 0.8722, UEM: 0.5211, LEM: 0.2954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6545, partial_loss/deprel_loss: 0.6932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8310, loss: 0.8775, batch_reg_loss: 0.1455, reg_loss: 0.1446 ||:  94%|#########3| 104/111 [01:09<00:04,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9282, LAS: 0.8725, UEM: 0.5207, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3772, partial_loss/deprel_loss: 0.5600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6690, loss: 0.8751, batch_reg_loss: 0.1455, reg_loss: 0.1446 ||:  97%|#########7| 108/111 [01:11<00:01,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7823, UAS: 0.9278, LAS: 0.8719, UEM: 0.5203, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0270, partial_loss/deprel_loss: 1.3010, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5918, loss: 0.8791, batch_reg_loss: 0.1456, reg_loss: 0.1446 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
+      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.301  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     2.027  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.145  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - UEM                      |     0.520  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - LAS                      |     0.872  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - loss                     |     0.879  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - LEM                      |     0.292  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - UAS                      |     0.928  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - EM                       |     0.782  |       N/A\n",
+      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:47:37,187 - INFO - combo.training.trainer - Epoch duration: 0:01:14.097322\n",
+      "2023-04-06 23:47:37,187 - INFO - combo.training.trainer - Estimated training time remaining: 7:47:54\n",
+      "2023-04-06 23:47:37,187 - INFO - allennlp.training.trainer - Epoch 44/399\n",
+      "2023-04-06 23:47:37,187 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:47:37,188 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:47:37,194 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9630, LAS: 0.9171, UEM: 0.7763, LEM: 0.5258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3786, partial_loss/deprel_loss: 0.5238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6404, loss: 0.5429, batch_reg_loss: 0.1456, reg_loss: 0.1456 ||:   3%|2         | 3/111 [00:02<01:23,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9468, LAS: 0.8951, UEM: 0.6389, LEM: 0.3900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5384, partial_loss/deprel_loss: 0.6080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7398, loss: 0.7117, batch_reg_loss: 0.1457, reg_loss: 0.1456 ||:   6%|6         | 7/111 [00:04<01:16,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9520, LAS: 0.9005, UEM: 0.6665, LEM: 0.3958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4527, partial_loss/deprel_loss: 0.5690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6915, loss: 0.6676, batch_reg_loss: 0.1458, reg_loss: 0.1457 ||:  10%|9         | 11/111 [00:07<01:09,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7963, UAS: 0.9398, LAS: 0.8874, UEM: 0.6268, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8417, partial_loss/deprel_loss: 1.2189, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4893, loss: 0.7801, batch_reg_loss: 0.1458, reg_loss: 0.1457 ||:  13%|#2        | 14/111 [00:09<01:07,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8781, UAS: 0.9389, LAS: 0.8862, UEM: 0.6093, LEM: 0.3491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6420, partial_loss/deprel_loss: 0.6886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8252, loss: 0.7783, batch_reg_loss: 0.1458, reg_loss: 0.1457 ||:  15%|#5        | 17/111 [00:11<01:06,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8938, UAS: 0.9394, LAS: 0.8866, UEM: 0.6067, LEM: 0.3482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4438, partial_loss/deprel_loss: 0.6601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7627, loss: 0.7781, batch_reg_loss: 0.1459, reg_loss: 0.1457 ||:  18%|#8        | 20/111 [00:13<01:04,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8509, UAS: 0.9330, LAS: 0.8786, UEM: 0.5653, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9093, partial_loss/deprel_loss: 0.8832, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0344, loss: 0.8428, batch_reg_loss: 0.1460, reg_loss: 0.1458 ||:  22%|##1       | 24/111 [00:16<00:59,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7874, UAS: 0.9295, LAS: 0.8749, UEM: 0.5659, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0483, partial_loss/deprel_loss: 1.1934, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5104, loss: 0.8740, batch_reg_loss: 0.1460, reg_loss: 0.1458 ||:  25%|##5       | 28/111 [00:18<00:56,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8710, UAS: 0.9314, LAS: 0.8773, UEM: 0.5799, LEM: 0.3389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6995, partial_loss/deprel_loss: 0.7559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8907, loss: 0.8550, batch_reg_loss: 0.1461, reg_loss: 0.1458 ||:  28%|##7       | 31/111 [00:21<00:55,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9303, LAS: 0.8762, UEM: 0.5832, LEM: 0.3393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4871, partial_loss/deprel_loss: 0.5664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6967, loss: 0.8632, batch_reg_loss: 0.1462, reg_loss: 0.1459 ||:  32%|###1      | 35/111 [00:23<00:51,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9297, LAS: 0.8753, UEM: 0.5582, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6452, partial_loss/deprel_loss: 0.7188, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8503, loss: 0.8698, batch_reg_loss: 0.1462, reg_loss: 0.1459 ||:  35%|###5      | 39/111 [00:26<00:48,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9305, LAS: 0.8756, UEM: 0.5537, LEM: 0.3114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7213, partial_loss/deprel_loss: 0.7833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9172, loss: 0.8642, batch_reg_loss: 0.1463, reg_loss: 0.1459 ||:  38%|###7      | 42/111 [00:28<00:47,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9290, LAS: 0.8735, UEM: 0.5410, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0237, partial_loss/deprel_loss: 0.8837, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0581, loss: 0.8770, batch_reg_loss: 0.1464, reg_loss: 0.1460 ||:  41%|####1     | 46/111 [00:30<00:43,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9317, LAS: 0.8768, UEM: 0.5692, LEM: 0.3247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3221, partial_loss/deprel_loss: 0.5263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6319, loss: 0.8508, batch_reg_loss: 0.1465, reg_loss: 0.1460 ||:  45%|####5     | 50/111 [00:33<00:40,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9321, LAS: 0.8772, UEM: 0.5601, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5211, partial_loss/deprel_loss: 0.6311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7556, loss: 0.8474, batch_reg_loss: 0.1465, reg_loss: 0.1460 ||:  49%|####8     | 54/111 [00:36<00:37,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9311, LAS: 0.8759, UEM: 0.5516, LEM: 0.3082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5666, partial_loss/deprel_loss: 0.6358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7685, loss: 0.8563, batch_reg_loss: 0.1466, reg_loss: 0.1461 ||:  52%|#####2    | 58/111 [00:38<00:35,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8161, UAS: 0.9310, LAS: 0.8758, UEM: 0.5487, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4201, partial_loss/deprel_loss: 1.0710, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2874, loss: 0.8568, batch_reg_loss: 0.1466, reg_loss: 0.1461 ||:  56%|#####5    | 62/111 [00:41<00:34,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9310, LAS: 0.8756, UEM: 0.5411, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6316, partial_loss/deprel_loss: 0.7124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8429, loss: 0.8575, batch_reg_loss: 0.1467, reg_loss: 0.1461 ||:  59%|#####8    | 65/111 [00:43<00:32,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9304, LAS: 0.8748, UEM: 0.5300, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8484, partial_loss/deprel_loss: 0.8227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9745, loss: 0.8617, batch_reg_loss: 0.1467, reg_loss: 0.1462 ||:  61%|######1   | 68/111 [00:46<00:29,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9297, LAS: 0.8742, UEM: 0.5247, LEM: 0.2871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5040, partial_loss/deprel_loss: 0.5522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6894, loss: 0.8663, batch_reg_loss: 0.1468, reg_loss: 0.1462 ||:  65%|######4   | 72/111 [00:48<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9296, LAS: 0.8740, UEM: 0.5207, LEM: 0.2814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2853, partial_loss/deprel_loss: 0.5267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6253, loss: 0.8694, batch_reg_loss: 0.1469, reg_loss: 0.1462 ||:  68%|######8   | 76/111 [00:51<00:23,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9301, LAS: 0.8746, UEM: 0.5239, LEM: 0.2825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4784, partial_loss/deprel_loss: 0.6309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7473, loss: 0.8649, batch_reg_loss: 0.1470, reg_loss: 0.1463 ||:  72%|#######2  | 80/111 [00:53<00:20,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9295, LAS: 0.8739, UEM: 0.5156, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8536, partial_loss/deprel_loss: 0.8270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9793, loss: 0.8710, batch_reg_loss: 0.1470, reg_loss: 0.1463 ||:  76%|#######5  | 84/111 [00:56<00:17,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8424, UAS: 0.9279, LAS: 0.8721, UEM: 0.5087, LEM: 0.2720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1010, partial_loss/deprel_loss: 0.9139, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0984, loss: 0.8855, batch_reg_loss: 0.1471, reg_loss: 0.1463 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9283, LAS: 0.8724, UEM: 0.5060, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7206, partial_loss/deprel_loss: 0.8822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9970, loss: 0.8843, batch_reg_loss: 0.1472, reg_loss: 0.1464 ||:  83%|########2 | 92/111 [01:01<00:11,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9280, LAS: 0.8721, UEM: 0.5019, LEM: 0.2653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9525, partial_loss/deprel_loss: 0.8787, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0407, loss: 0.8880, batch_reg_loss: 0.1473, reg_loss: 0.1464 ||:  86%|########6 | 96/111 [01:03<00:09,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9288, LAS: 0.8728, UEM: 0.5220, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0723, partial_loss/deprel_loss: 0.2095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3294, loss: 0.8826, batch_reg_loss: 0.1473, reg_loss: 0.1464 ||:  90%|######### | 100/111 [01:07<00:07,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9286, LAS: 0.8726, UEM: 0.5207, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3335, partial_loss/deprel_loss: 1.0984, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2928, loss: 0.8856, batch_reg_loss: 0.1474, reg_loss: 0.1465 ||:  93%|#########2| 103/111 [01:09<00:05,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8814, UAS: 0.9291, LAS: 0.8730, UEM: 0.5236, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4793, partial_loss/deprel_loss: 0.6887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7942, loss: 0.8808, batch_reg_loss: 0.1474, reg_loss: 0.1465 ||:  95%|#########5| 106/111 [01:11<00:03,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9294, LAS: 0.8734, UEM: 0.5320, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1479, partial_loss/deprel_loss: 0.2737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3960, loss: 0.8765, batch_reg_loss: 0.1475, reg_loss: 0.1465 ||:  98%|#########8| 109/111 [01:13<00:01,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9296, LAS: 0.8735, UEM: 0.5301, LEM: 0.2970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6356, partial_loss/deprel_loss: 0.8034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9174, loss: 0.8758, batch_reg_loss: 0.1475, reg_loss: 0.1465 ||: 100%|##########| 111/111 [01:15<00:00,  1.48it/s]\n",
+      "2023-04-06 23:48:52,323 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:48:52,323 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.803  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.636  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.147  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - UEM                      |     0.530  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - LAS                      |     0.873  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - loss                     |     0.876  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - LEM                      |     0.297  |       N/A\n",
+      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
+      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - EM                       |     0.877  |       N/A\n",
+      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:48:52,326 - INFO - combo.training.trainer - Epoch duration: 0:01:15.138417\n",
+      "2023-04-06 23:48:52,326 - INFO - combo.training.trainer - Estimated training time remaining: 7:46:06\n",
+      "2023-04-06 23:48:52,326 - INFO - allennlp.training.trainer - Epoch 45/399\n",
+      "2023-04-06 23:48:52,326 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:48:52,326 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:48:52,334 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9169, LAS: 0.8645, UEM: 0.6209, LEM: 0.3762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3488, partial_loss/deprel_loss: 0.4880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6077, loss: 0.9611, batch_reg_loss: 0.1476, reg_loss: 0.1476 ||:   4%|3         | 4/111 [00:02<01:17,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7991, UAS: 0.9205, LAS: 0.8661, UEM: 0.6082, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7394, partial_loss/deprel_loss: 1.2242, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4749, loss: 0.9431, batch_reg_loss: 0.1476, reg_loss: 0.1476 ||:   6%|6         | 7/111 [00:05<01:14,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9206, LAS: 0.8646, UEM: 0.5249, LEM: 0.2889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7115, partial_loss/deprel_loss: 0.7655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9024, loss: 0.9411, batch_reg_loss: 0.1477, reg_loss: 0.1476 ||:  10%|9         | 11/111 [00:07<01:07,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8830, UAS: 0.9248, LAS: 0.8690, UEM: 0.5142, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5019, partial_loss/deprel_loss: 0.7006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8086, loss: 0.8999, batch_reg_loss: 0.1478, reg_loss: 0.1476 ||:  13%|#2        | 14/111 [00:09<01:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9275, LAS: 0.8721, UEM: 0.5363, LEM: 0.2925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2829, partial_loss/deprel_loss: 0.3895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.8710, batch_reg_loss: 0.1478, reg_loss: 0.1477 ||:  15%|#5        | 17/111 [00:11<01:06,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8806, UAS: 0.9285, LAS: 0.8730, UEM: 0.5128, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5980, partial_loss/deprel_loss: 0.6489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 0.8690, batch_reg_loss: 0.1479, reg_loss: 0.1477 ||:  18%|#8        | 20/111 [00:13<01:04,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9269, LAS: 0.8713, UEM: 0.4956, LEM: 0.2596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9929, partial_loss/deprel_loss: 0.9136, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0774, loss: 0.8785, batch_reg_loss: 0.1479, reg_loss: 0.1477 ||:  21%|##        | 23/111 [00:15<01:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9277, LAS: 0.8720, UEM: 0.4875, LEM: 0.2508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7347, partial_loss/deprel_loss: 0.7592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9022, loss: 0.8687, batch_reg_loss: 0.1480, reg_loss: 0.1478 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9321, LAS: 0.8777, UEM: 0.5737, LEM: 0.3447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3178, partial_loss/deprel_loss: 0.5158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6243, loss: 0.8307, batch_reg_loss: 0.1480, reg_loss: 0.1478 ||:  26%|##6       | 29/111 [00:21<01:05,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9321, LAS: 0.8777, UEM: 0.5882, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4529, partial_loss/deprel_loss: 0.5867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7080, loss: 0.8318, batch_reg_loss: 0.1481, reg_loss: 0.1478 ||:  30%|##9       | 33/111 [00:23<00:58,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9305, LAS: 0.8756, UEM: 0.5741, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8034, partial_loss/deprel_loss: 0.8026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9509, loss: 0.8478, batch_reg_loss: 0.1481, reg_loss: 0.1478 ||:  32%|###2      | 36/111 [00:25<00:54,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9317, LAS: 0.8763, UEM: 0.5771, LEM: 0.3511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6548, partial_loss/deprel_loss: 0.8313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9442, loss: 0.8396, batch_reg_loss: 0.1482, reg_loss: 0.1479 ||:  35%|###5      | 39/111 [00:27<00:52,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9338, LAS: 0.8790, UEM: 0.5864, LEM: 0.3539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3781, partial_loss/deprel_loss: 0.5629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6742, loss: 0.8236, batch_reg_loss: 0.1482, reg_loss: 0.1479 ||:  39%|###8      | 43/111 [00:30<00:47,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9320, LAS: 0.8768, UEM: 0.5703, LEM: 0.3423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1642, partial_loss/deprel_loss: 0.9447, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1368, loss: 0.8393, batch_reg_loss: 0.1483, reg_loss: 0.1479 ||:  41%|####1     | 46/111 [00:32<00:45,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9331, LAS: 0.8779, UEM: 0.5812, LEM: 0.3521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1896, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4418, loss: 0.8277, batch_reg_loss: 0.1483, reg_loss: 0.1479 ||:  44%|####4     | 49/111 [00:34<00:42,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9328, LAS: 0.8772, UEM: 0.5853, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1467, partial_loss/deprel_loss: 0.3971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4954, loss: 0.8332, batch_reg_loss: 0.1484, reg_loss: 0.1480 ||:  47%|####6     | 52/111 [00:36<00:40,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8404, UAS: 0.9322, LAS: 0.8766, UEM: 0.5773, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2362, partial_loss/deprel_loss: 0.9801, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1798, loss: 0.8400, batch_reg_loss: 0.1484, reg_loss: 0.1480 ||:  50%|####9     | 55/111 [00:38<00:39,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9298, LAS: 0.8743, UEM: 0.5684, LEM: 0.3423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3632, partial_loss/deprel_loss: 0.4450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5771, loss: 0.8590, batch_reg_loss: 0.1485, reg_loss: 0.1480 ||:  53%|#####3    | 59/111 [00:41<00:37,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9287, LAS: 0.8731, UEM: 0.5648, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3237, partial_loss/deprel_loss: 0.4315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5585, loss: 0.8692, batch_reg_loss: 0.1485, reg_loss: 0.1480 ||:  56%|#####5    | 62/111 [00:44<00:35,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9284, LAS: 0.8725, UEM: 0.5539, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2580, partial_loss/deprel_loss: 1.0314, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2254, loss: 0.8760, batch_reg_loss: 0.1486, reg_loss: 0.1481 ||:  59%|#####9    | 66/111 [00:46<00:31,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8227, UAS: 0.9278, LAS: 0.8719, UEM: 0.5486, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4298, partial_loss/deprel_loss: 0.9430, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1891, loss: 0.8808, batch_reg_loss: 0.1487, reg_loss: 0.1481 ||:  62%|######2   | 69/111 [00:48<00:29,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9270, LAS: 0.8709, UEM: 0.5420, LEM: 0.3179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6441, partial_loss/deprel_loss: 0.6258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7782, loss: 0.8877, batch_reg_loss: 0.1487, reg_loss: 0.1481 ||:  65%|######4   | 72/111 [00:50<00:27,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8926, UAS: 0.9276, LAS: 0.8713, UEM: 0.5411, LEM: 0.3138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4335, partial_loss/deprel_loss: 0.6407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7481, loss: 0.8853, batch_reg_loss: 0.1488, reg_loss: 0.1482 ||:  68%|######8   | 76/111 [00:53<00:24,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8540, UAS: 0.9268, LAS: 0.8706, UEM: 0.5445, LEM: 0.3183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9612, partial_loss/deprel_loss: 0.8148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9930, loss: 0.8901, batch_reg_loss: 0.1489, reg_loss: 0.1482 ||:  71%|#######1  | 79/111 [00:55<00:22,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9272, LAS: 0.8709, UEM: 0.5434, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3584, partial_loss/deprel_loss: 0.5370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6502, loss: 0.8875, batch_reg_loss: 0.1490, reg_loss: 0.1482 ||:  74%|#######3  | 82/111 [00:58<00:21,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.9271, LAS: 0.8708, UEM: 0.5359, LEM: 0.3090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1788, partial_loss/deprel_loss: 0.9773, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1667, loss: 0.8887, batch_reg_loss: 0.1490, reg_loss: 0.1483 ||:  77%|#######7  | 86/111 [01:00<00:17,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8259, UAS: 0.9264, LAS: 0.8700, UEM: 0.5294, LEM: 0.3038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1285, partial_loss/deprel_loss: 1.1447, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2905, loss: 0.8945, batch_reg_loss: 0.1491, reg_loss: 0.1483 ||:  81%|########1 | 90/111 [01:02<00:13,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9266, LAS: 0.8703, UEM: 0.5230, LEM: 0.2979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9470, partial_loss/deprel_loss: 0.7802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9627, loss: 0.8945, batch_reg_loss: 0.1492, reg_loss: 0.1483 ||:  85%|########4 | 94/111 [01:05<00:11,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9273, LAS: 0.8712, UEM: 0.5234, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2959, partial_loss/deprel_loss: 0.5120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6180, loss: 0.8880, batch_reg_loss: 0.1493, reg_loss: 0.1484 ||:  88%|########8 | 98/111 [01:07<00:08,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9275, LAS: 0.8714, UEM: 0.5286, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2757, partial_loss/deprel_loss: 0.9351, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1526, loss: 0.8843, batch_reg_loss: 0.1493, reg_loss: 0.1484 ||:  92%|#########1| 102/111 [01:10<00:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9280, LAS: 0.8719, UEM: 0.5266, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5151, partial_loss/deprel_loss: 0.5887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7234, loss: 0.8805, batch_reg_loss: 0.1494, reg_loss: 0.1484 ||:  95%|#########5| 106/111 [01:13<00:03,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9284, LAS: 0.8724, UEM: 0.5281, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3449, partial_loss/deprel_loss: 0.4950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6144, loss: 0.8774, batch_reg_loss: 0.1494, reg_loss: 0.1485 ||:  99%|#########9| 110/111 [01:16<00:00,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8283, UAS: 0.9282, LAS: 0.8720, UEM: 0.5259, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1604, partial_loss/deprel_loss: 1.0838, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2486, loss: 0.8807, batch_reg_loss: 0.1495, reg_loss: 0.1485 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-06 23:50:09,062 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9534, LAS: 0.9001, UEM: 0.6753, LEM: 0.3628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1819, partial_loss/deprel_loss: 23.7693, partial_loss/cycle_loss: 0.0000, batch_loss: 19.0518, loss: 22.2928, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9487, LAS: 0.8920, UEM: 0.6040, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9910, partial_loss/deprel_loss: 37.4935, partial_loss/cycle_loss: 0.0000, batch_loss: 30.1930, loss: 23.5104, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9415, LAS: 0.8858, UEM: 0.5706, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9017, partial_loss/deprel_loss: 31.2307, partial_loss/cycle_loss: 0.0000, batch_loss: 25.1649, loss: 25.3184, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:07<00:03,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9419, LAS: 0.8882, UEM: 0.6289, LEM: 0.3770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1918, partial_loss/deprel_loss: 20.7598, partial_loss/cycle_loss: 0.0000, batch_loss: 16.6462, loss: 25.8303, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:09<00:01,  1.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8678, UAS: 0.9422, LAS: 0.8879, UEM: 0.6232, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0590, partial_loss/deprel_loss: 43.7483, partial_loss/cycle_loss: 0.0000, batch_loss: 35.2104, loss: 26.2072, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00,  1.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8678, UAS: 0.9422, LAS: 0.8879, UEM: 0.6232, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0590, partial_loss/deprel_loss: 43.7483, partial_loss/cycle_loss: 0.0000, batch_loss: 35.2104, loss: 26.2072, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00,  1.09it/s]\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.084  |    43.748\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.160  |     1.059\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.148  |     0.000\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - UEM                      |     0.526  |     0.623\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - LAS                      |     0.872  |     0.888\n",
+      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - loss                     |     0.881  |    26.207\n",
+      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - LEM                      |     0.296  |     0.363\n",
+      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - UAS                      |     0.928  |     0.942\n",
+      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - EM                       |     0.828  |     0.868\n",
+      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:50:21,017 - INFO - combo.training.trainer - Epoch duration: 0:01:28.691575\n",
+      "2023-04-06 23:50:21,018 - INFO - combo.training.trainer - Estimated training time remaining: 7:46:03\n",
+      "2023-04-06 23:50:21,018 - INFO - allennlp.training.trainer - Epoch 46/399\n",
+      "2023-04-06 23:50:21,018 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:50:21,018 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:50:21,024 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9393, LAS: 0.8848, UEM: 0.7867, LEM: 0.5840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1217, partial_loss/deprel_loss: 0.2555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3782, loss: 0.7494, batch_reg_loss: 0.1495, reg_loss: 0.1495 ||:   3%|2         | 3/111 [00:02<01:20,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8622, UAS: 0.9277, LAS: 0.8710, UEM: 0.5986, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7870, partial_loss/deprel_loss: 0.9187, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0420, loss: 0.8931, batch_reg_loss: 0.1496, reg_loss: 0.1495 ||:   6%|6         | 7/111 [00:04<01:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9300, LAS: 0.8734, UEM: 0.5550, LEM: 0.3467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4426, partial_loss/deprel_loss: 0.5726, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6963, loss: 0.8855, batch_reg_loss: 0.1496, reg_loss: 0.1496 ||:  10%|9         | 11/111 [00:06<01:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9345, LAS: 0.8780, UEM: 0.5825, LEM: 0.3564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2641, partial_loss/deprel_loss: 0.3866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.8413, batch_reg_loss: 0.1497, reg_loss: 0.1496 ||:  13%|#2        | 14/111 [00:08<01:05,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9332, LAS: 0.8768, UEM: 0.5385, LEM: 0.3190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9611, partial_loss/deprel_loss: 0.9256, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0825, loss: 0.8551, batch_reg_loss: 0.1498, reg_loss: 0.1496 ||:  16%|#6        | 18/111 [00:11<01:00,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9320, LAS: 0.8767, UEM: 0.5975, LEM: 0.3967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0807, partial_loss/deprel_loss: 0.1996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3256, loss: 0.8484, batch_reg_loss: 0.1498, reg_loss: 0.1496 ||:  20%|#9        | 22/111 [00:14<01:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9341, LAS: 0.8794, UEM: 0.5979, LEM: 0.3846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4832, partial_loss/deprel_loss: 0.6899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7985, loss: 0.8280, batch_reg_loss: 0.1499, reg_loss: 0.1497 ||:  23%|##2       | 25/111 [00:16<00:58,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9348, LAS: 0.8796, UEM: 0.5840, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3874, partial_loss/deprel_loss: 0.6064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7125, loss: 0.8244, batch_reg_loss: 0.1499, reg_loss: 0.1497 ||:  26%|##6       | 29/111 [00:19<00:55,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9347, LAS: 0.8794, UEM: 0.5729, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5306, partial_loss/deprel_loss: 0.5927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7302, loss: 0.8259, batch_reg_loss: 0.1500, reg_loss: 0.1497 ||:  29%|##8       | 32/111 [00:21<00:53,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9323, LAS: 0.8763, UEM: 0.5530, LEM: 0.3312, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5293, partial_loss/deprel_loss: 0.6402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7681, loss: 0.8487, batch_reg_loss: 0.1500, reg_loss: 0.1498 ||:  32%|###2      | 36/111 [00:23<00:49,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9328, LAS: 0.8771, UEM: 0.5633, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1378, partial_loss/deprel_loss: 0.3228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4359, loss: 0.8430, batch_reg_loss: 0.1501, reg_loss: 0.1498 ||:  35%|###5      | 39/111 [00:25<00:48,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9319, LAS: 0.8759, UEM: 0.5512, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.6162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7192, loss: 0.8529, batch_reg_loss: 0.1501, reg_loss: 0.1498 ||:  39%|###8      | 43/111 [00:28<00:45,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9323, LAS: 0.8762, UEM: 0.5401, LEM: 0.3185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4595, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6904, loss: 0.8498, batch_reg_loss: 0.1502, reg_loss: 0.1498 ||:  42%|####2     | 47/111 [00:30<00:41,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9327, LAS: 0.8767, UEM: 0.5498, LEM: 0.3266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0265, partial_loss/deprel_loss: 0.8848, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0634, loss: 0.8436, batch_reg_loss: 0.1503, reg_loss: 0.1499 ||:  46%|####5     | 51/111 [00:33<00:38,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9336, LAS: 0.8777, UEM: 0.5578, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9532, partial_loss/deprel_loss: 0.9401, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0931, loss: 0.8347, batch_reg_loss: 0.1503, reg_loss: 0.1499 ||:  50%|####9     | 55/111 [00:35<00:35,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8091, UAS: 0.9310, LAS: 0.8748, UEM: 0.5446, LEM: 0.3223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6452, partial_loss/deprel_loss: 1.0977, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3576, loss: 0.8591, batch_reg_loss: 0.1504, reg_loss: 0.1499 ||:  53%|#####3    | 59/111 [00:38<00:32,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9295, LAS: 0.8733, UEM: 0.5337, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5317, partial_loss/deprel_loss: 0.6523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7787, loss: 0.8732, batch_reg_loss: 0.1505, reg_loss: 0.1500 ||:  57%|#####6    | 63/111 [00:40<00:30,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9297, LAS: 0.8738, UEM: 0.5323, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2996, partial_loss/deprel_loss: 0.4510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5713, loss: 0.8672, batch_reg_loss: 0.1505, reg_loss: 0.1500 ||:  60%|######    | 67/111 [00:43<00:28,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9302, LAS: 0.8744, UEM: 0.5323, LEM: 0.3087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2982, partial_loss/deprel_loss: 0.4410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5631, loss: 0.8616, batch_reg_loss: 0.1506, reg_loss: 0.1500 ||:  64%|######3   | 71/111 [00:46<00:26,  1.51it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8887, UAS: 0.9310, LAS: 0.8752, UEM: 0.5322, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4613, partial_loss/deprel_loss: 0.6015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7241, loss: 0.8551, batch_reg_loss: 0.1507, reg_loss: 0.1501 ||:  68%|######7   | 75/111 [00:49<00:24,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9300, LAS: 0.8740, UEM: 0.5275, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3972, partial_loss/deprel_loss: 0.5661, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6831, loss: 0.8679, batch_reg_loss: 0.1508, reg_loss: 0.1501 ||:  71%|#######1  | 79/111 [00:51<00:21,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8049, UAS: 0.9278, LAS: 0.8714, UEM: 0.5172, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6741, partial_loss/deprel_loss: 1.1973, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4435, loss: 0.8901, batch_reg_loss: 0.1508, reg_loss: 0.1501 ||:  75%|#######4  | 83/111 [00:54<00:18,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9281, LAS: 0.8717, UEM: 0.5223, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3916, partial_loss/deprel_loss: 0.5200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6452, loss: 0.8872, batch_reg_loss: 0.1509, reg_loss: 0.1502 ||:  78%|#######8  | 87/111 [00:57<00:16,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9278, LAS: 0.8714, UEM: 0.5150, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5170, partial_loss/deprel_loss: 0.6603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7826, loss: 0.8900, batch_reg_loss: 0.1510, reg_loss: 0.1502 ||:  82%|########1 | 91/111 [00:59<00:13,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8360, UAS: 0.9279, LAS: 0.8717, UEM: 0.5151, LEM: 0.2906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3055, partial_loss/deprel_loss: 0.9726, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1902, loss: 0.8875, batch_reg_loss: 0.1511, reg_loss: 0.1502 ||:  86%|########5 | 95/111 [01:01<00:10,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9284, LAS: 0.8722, UEM: 0.5175, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1813, partial_loss/deprel_loss: 0.4224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5253, loss: 0.8842, batch_reg_loss: 0.1512, reg_loss: 0.1503 ||:  89%|########9 | 99/111 [01:04<00:07,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9288, LAS: 0.8727, UEM: 0.5197, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2933, partial_loss/deprel_loss: 0.4974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6078, loss: 0.8797, batch_reg_loss: 0.1512, reg_loss: 0.1503 ||:  93%|#########2| 103/111 [01:07<00:05,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7736, UAS: 0.9286, LAS: 0.8725, UEM: 0.5249, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1080, partial_loss/deprel_loss: 1.4011, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6937, loss: 0.8808, batch_reg_loss: 0.1513, reg_loss: 0.1504 ||:  96%|#########6| 107/111 [01:10<00:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9285, LAS: 0.8723, UEM: 0.5211, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4362, partial_loss/deprel_loss: 0.5338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6656, loss: 0.8816, batch_reg_loss: 0.1513, reg_loss: 0.1504 ||:  99%|#########9| 110/111 [01:12<00:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9286, LAS: 0.8724, UEM: 0.5211, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5446, partial_loss/deprel_loss: 0.5990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7395, loss: 0.8803, batch_reg_loss: 0.1513, reg_loss: 0.1504 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.599  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.545  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.150  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - UEM                      |     0.521  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - LAS                      |     0.872  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - loss                     |     0.880  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - LEM                      |     0.294  |       N/A\n",
+      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
+      "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - EM                       |     0.890  |       N/A\n",
+      "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:51:34,486 - INFO - combo.training.trainer - Epoch duration: 0:01:13.468063\n",
+      "2023-04-06 23:51:34,486 - INFO - combo.training.trainer - Estimated training time remaining: 7:44:03\n",
+      "2023-04-06 23:51:34,486 - INFO - allennlp.training.trainer - Epoch 47/399\n",
+      "2023-04-06 23:51:34,486 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:51:34,487 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:51:34,497 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8854, UAS: 0.9484, LAS: 0.8921, UEM: 0.5152, LEM: 0.2265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5373, partial_loss/deprel_loss: 0.6751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7989, loss: 0.7461, batch_reg_loss: 0.1514, reg_loss: 0.1514 ||:   4%|3         | 4/111 [00:02<01:05,  1.63it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9466, LAS: 0.8903, UEM: 0.5488, LEM: 0.2500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4419, partial_loss/deprel_loss: 0.6563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7649, loss: 0.7337, batch_reg_loss: 0.1514, reg_loss: 0.1514 ||:   6%|6         | 7/111 [00:04<01:10,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9452, LAS: 0.8893, UEM: 0.5505, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5635, partial_loss/deprel_loss: 0.6452, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7804, loss: 0.7389, batch_reg_loss: 0.1515, reg_loss: 0.1514 ||:   9%|9         | 10/111 [00:07<01:09,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8630, UAS: 0.9440, LAS: 0.8878, UEM: 0.5283, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8270, partial_loss/deprel_loss: 0.9081, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0434, loss: 0.7611, batch_reg_loss: 0.1515, reg_loss: 0.1514 ||:  12%|#1        | 13/111 [00:09<01:07,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9360, LAS: 0.8785, UEM: 0.4933, LEM: 0.2363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5545, partial_loss/deprel_loss: 0.6104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7509, loss: 0.8289, batch_reg_loss: 0.1516, reg_loss: 0.1515 ||:  15%|#5        | 17/111 [00:11<01:02,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9351, LAS: 0.8776, UEM: 0.4647, LEM: 0.2148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5660, partial_loss/deprel_loss: 0.6389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7760, loss: 0.8371, batch_reg_loss: 0.1517, reg_loss: 0.1515 ||:  19%|#8        | 21/111 [00:13<00:57,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9373, LAS: 0.8812, UEM: 0.4902, LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2424, partial_loss/deprel_loss: 0.4311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5451, loss: 0.8146, batch_reg_loss: 0.1517, reg_loss: 0.1515 ||:  22%|##1       | 24/111 [00:16<00:57,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9377, LAS: 0.8817, UEM: 0.5209, LEM: 0.2785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4732, partial_loss/deprel_loss: 0.6436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7613, loss: 0.8096, batch_reg_loss: 0.1518, reg_loss: 0.1516 ||:  24%|##4       | 27/111 [00:18<00:55,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8254, UAS: 0.9377, LAS: 0.8823, UEM: 0.5501, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4170, partial_loss/deprel_loss: 1.0259, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2560, loss: 0.8059, batch_reg_loss: 0.1518, reg_loss: 0.1516 ||:  28%|##7       | 31/111 [00:20<00:52,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9379, LAS: 0.8831, UEM: 0.5481, LEM: 0.3144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3535, partial_loss/deprel_loss: 0.4208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5592, loss: 0.8039, batch_reg_loss: 0.1519, reg_loss: 0.1516 ||:  31%|###       | 34/111 [00:22<00:51,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8378, UAS: 0.9348, LAS: 0.8797, UEM: 0.5299, LEM: 0.3030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1099, partial_loss/deprel_loss: 1.1716, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3112, loss: 0.8368, batch_reg_loss: 0.1519, reg_loss: 0.1516 ||:  33%|###3      | 37/111 [00:24<00:49,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9310, LAS: 0.8754, UEM: 0.5079, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8518, partial_loss/deprel_loss: 0.8380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9927, loss: 0.8694, batch_reg_loss: 0.1520, reg_loss: 0.1517 ||:  37%|###6      | 41/111 [00:27<00:46,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8168, UAS: 0.9289, LAS: 0.8730, UEM: 0.4885, LEM: 0.2745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4595, partial_loss/deprel_loss: 1.1418, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3574, loss: 0.8871, batch_reg_loss: 0.1521, reg_loss: 0.1517 ||:  41%|####      | 45/111 [00:29<00:43,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9281, LAS: 0.8723, UEM: 0.4868, LEM: 0.2702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4924, partial_loss/deprel_loss: 0.6568, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7761, loss: 0.8943, batch_reg_loss: 0.1521, reg_loss: 0.1517 ||:  44%|####4     | 49/111 [00:32<00:41,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9272, LAS: 0.8714, UEM: 0.4838, LEM: 0.2672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3521, partial_loss/deprel_loss: 0.5455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6591, loss: 0.9020, batch_reg_loss: 0.1522, reg_loss: 0.1518 ||:  47%|####6     | 52/111 [00:34<00:39,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9289, LAS: 0.8733, UEM: 0.5055, LEM: 0.2813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2791, partial_loss/deprel_loss: 0.4182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5426, loss: 0.8857, batch_reg_loss: 0.1523, reg_loss: 0.1518 ||:  50%|####9     | 55/111 [00:37<00:39,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9281, LAS: 0.8722, UEM: 0.4949, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7369, partial_loss/deprel_loss: 0.7573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9055, loss: 0.8954, batch_reg_loss: 0.1523, reg_loss: 0.1518 ||:  52%|#####2    | 58/111 [00:39<00:37,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9273, LAS: 0.8712, UEM: 0.4849, LEM: 0.2654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5280, partial_loss/deprel_loss: 0.7407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8505, loss: 0.9024, batch_reg_loss: 0.1524, reg_loss: 0.1518 ||:  55%|#####4    | 61/111 [00:41<00:34,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9278, LAS: 0.8717, UEM: 0.4898, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3571, partial_loss/deprel_loss: 0.5670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6775, loss: 0.8988, batch_reg_loss: 0.1525, reg_loss: 0.1519 ||:  59%|#####8    | 65/111 [00:43<00:30,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9284, LAS: 0.8724, UEM: 0.4908, LEM: 0.2672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7764, partial_loss/deprel_loss: 0.8388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9789, loss: 0.8927, batch_reg_loss: 0.1525, reg_loss: 0.1519 ||:  61%|######1   | 68/111 [00:45<00:29,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9291, LAS: 0.8732, UEM: 0.5030, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1377, partial_loss/deprel_loss: 0.3870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4897, loss: 0.8876, batch_reg_loss: 0.1526, reg_loss: 0.1519 ||:  64%|######3   | 71/111 [00:48<00:28,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9283, LAS: 0.8722, UEM: 0.4949, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9420, partial_loss/deprel_loss: 0.8445, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0166, loss: 0.8945, batch_reg_loss: 0.1526, reg_loss: 0.1520 ||:  68%|######7   | 75/111 [00:50<00:24,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9281, LAS: 0.8719, UEM: 0.4908, LEM: 0.2648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4672, partial_loss/deprel_loss: 0.6235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7450, loss: 0.8979, batch_reg_loss: 0.1527, reg_loss: 0.1520 ||:  71%|#######1  | 79/111 [00:53<00:21,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9287, LAS: 0.8727, UEM: 0.4885, LEM: 0.2607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5525, partial_loss/deprel_loss: 0.6233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7619, loss: 0.8915, batch_reg_loss: 0.1528, reg_loss: 0.1520 ||:  75%|#######4  | 83/111 [00:55<00:18,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8832, UAS: 0.9288, LAS: 0.8729, UEM: 0.4905, LEM: 0.2638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6938, partial_loss/deprel_loss: 0.7008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8522, loss: 0.8901, batch_reg_loss: 0.1528, reg_loss: 0.1521 ||:  78%|#######8  | 87/111 [00:58<00:15,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9289, LAS: 0.8732, UEM: 0.4935, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8700, partial_loss/deprel_loss: 0.8386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9978, loss: 0.8883, batch_reg_loss: 0.1529, reg_loss: 0.1521 ||:  82%|########1 | 91/111 [01:01<00:13,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9280, LAS: 0.8724, UEM: 0.4954, LEM: 0.2697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2556, partial_loss/deprel_loss: 0.3945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5197, loss: 0.8933, batch_reg_loss: 0.1530, reg_loss: 0.1521 ||:  85%|########4 | 94/111 [01:03<00:11,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9572, UAS: 0.9289, LAS: 0.8735, UEM: 0.5164, LEM: 0.2943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0686, partial_loss/deprel_loss: 0.1776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3088, loss: 0.8856, batch_reg_loss: 0.1530, reg_loss: 0.1522 ||:  87%|########7 | 97/111 [01:06<00:10,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9289, LAS: 0.8735, UEM: 0.5153, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3051, partial_loss/deprel_loss: 0.4620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5837, loss: 0.8855, batch_reg_loss: 0.1531, reg_loss: 0.1522 ||:  91%|######### | 101/111 [01:08<00:07,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9299, LAS: 0.8746, UEM: 0.5268, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2536, partial_loss/deprel_loss: 0.3871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5135, loss: 0.8753, batch_reg_loss: 0.1532, reg_loss: 0.1522 ||:  95%|#########4| 105/111 [01:10<00:03,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9301, LAS: 0.8749, UEM: 0.5290, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2639, partial_loss/deprel_loss: 0.4698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5818, loss: 0.8739, batch_reg_loss: 0.1532, reg_loss: 0.1523 ||:  98%|#########8| 109/111 [01:12<00:01,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9302, LAS: 0.8748, UEM: 0.5266, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7826, partial_loss/deprel_loss: 0.8032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9523, loss: 0.8742, batch_reg_loss: 0.1532, reg_loss: 0.1523 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
+      "2023-04-06 23:52:48,579 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:52:48,579 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.803  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.783  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.152  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - UEM                      |     0.527  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - LAS                      |     0.875  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - loss                     |     0.874  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - LEM                      |     0.301  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
+      "2023-04-06 23:52:48,581 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:52:48,581 - INFO - combo.training.tensorboard_writer - EM                       |     0.861  |       N/A\n",
+      "2023-04-06 23:52:48,581 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:52:48,581 - INFO - combo.training.trainer - Epoch duration: 0:01:14.095098\n",
+      "2023-04-06 23:52:48,581 - INFO - combo.training.trainer - Estimated training time remaining: 7:42:09\n",
+      "2023-04-06 23:52:48,581 - INFO - allennlp.training.trainer - Epoch 48/399\n",
+      "2023-04-06 23:52:48,581 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:52:48,582 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:52:48,587 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9342, LAS: 0.8798, UEM: 0.4156, LEM: 0.1978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4324, partial_loss/deprel_loss: 0.5304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6641, loss: 0.8418, batch_reg_loss: 0.1533, reg_loss: 0.1533 ||:   4%|3         | 4/111 [00:02<01:08,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8507, UAS: 0.9253, LAS: 0.8706, UEM: 0.3450, LEM: 0.1517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0604, partial_loss/deprel_loss: 0.8071, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0111, loss: 0.9093, batch_reg_loss: 0.1534, reg_loss: 0.1533 ||:   7%|7         | 8/111 [00:04<01:04,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9315, LAS: 0.8776, UEM: 0.5266, LEM: 0.3168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9183, partial_loss/deprel_loss: 0.9036, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0599, loss: 0.8473, batch_reg_loss: 0.1534, reg_loss: 0.1533 ||:  10%|9         | 11/111 [00:07<01:08,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9278, LAS: 0.8743, UEM: 0.5129, LEM: 0.3092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9617, partial_loss/deprel_loss: 0.8241, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0050, loss: 0.8777, batch_reg_loss: 0.1534, reg_loss: 0.1533 ||:  13%|#2        | 14/111 [00:09<01:06,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9300, LAS: 0.8761, UEM: 0.5064, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7605, partial_loss/deprel_loss: 0.8143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9571, loss: 0.8568, batch_reg_loss: 0.1535, reg_loss: 0.1534 ||:  16%|#6        | 18/111 [00:12<01:02,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9269, LAS: 0.8725, UEM: 0.4682, LEM: 0.2664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0474, partial_loss/deprel_loss: 0.8697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0588, loss: 0.8885, batch_reg_loss: 0.1536, reg_loss: 0.1534 ||:  20%|#9        | 22/111 [00:14<00:58,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9289, LAS: 0.8747, UEM: 0.4699, LEM: 0.2578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4745, partial_loss/deprel_loss: 0.5828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7148, loss: 0.8740, batch_reg_loss: 0.1536, reg_loss: 0.1534 ||:  23%|##3       | 26/111 [00:16<00:54,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9288, LAS: 0.8747, UEM: 0.4876, LEM: 0.2748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3346, partial_loss/deprel_loss: 0.4859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6094, loss: 0.8699, batch_reg_loss: 0.1537, reg_loss: 0.1535 ||:  27%|##7       | 30/111 [00:19<00:52,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9319, LAS: 0.8781, UEM: 0.5407, LEM: 0.3196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1436, partial_loss/deprel_loss: 0.3075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4285, loss: 0.8452, batch_reg_loss: 0.1538, reg_loss: 0.1535 ||:  30%|##9       | 33/111 [00:21<00:53,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9313, LAS: 0.8776, UEM: 0.5379, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.5909, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7208, loss: 0.8510, batch_reg_loss: 0.1538, reg_loss: 0.1535 ||:  33%|###3      | 37/111 [00:24<00:49,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9324, LAS: 0.8791, UEM: 0.5453, LEM: 0.3157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3170, partial_loss/deprel_loss: 0.4551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5813, loss: 0.8379, batch_reg_loss: 0.1539, reg_loss: 0.1536 ||:  36%|###6      | 40/111 [00:26<00:48,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9319, LAS: 0.8783, UEM: 0.5334, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5949, partial_loss/deprel_loss: 0.6138, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7640, loss: 0.8391, batch_reg_loss: 0.1539, reg_loss: 0.1536 ||:  39%|###8      | 43/111 [00:28<00:47,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9336, LAS: 0.8803, UEM: 0.5564, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.3773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5012, loss: 0.8227, batch_reg_loss: 0.1540, reg_loss: 0.1536 ||:  41%|####1     | 46/111 [00:31<00:46,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9314, LAS: 0.8775, UEM: 0.5413, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5589, partial_loss/deprel_loss: 0.5810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7306, loss: 0.8463, batch_reg_loss: 0.1540, reg_loss: 0.1536 ||:  45%|####5     | 50/111 [00:33<00:42,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9315, LAS: 0.8776, UEM: 0.5407, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4884, loss: 0.8460, batch_reg_loss: 0.1541, reg_loss: 0.1537 ||:  48%|####7     | 53/111 [00:35<00:40,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9324, LAS: 0.8785, UEM: 0.5441, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3978, partial_loss/deprel_loss: 0.6004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7141, loss: 0.8389, batch_reg_loss: 0.1542, reg_loss: 0.1537 ||:  51%|#####1    | 57/111 [00:38<00:37,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9316, LAS: 0.8776, UEM: 0.5364, LEM: 0.3044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6206, partial_loss/deprel_loss: 0.7314, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8634, loss: 0.8457, batch_reg_loss: 0.1542, reg_loss: 0.1537 ||:  54%|#####4    | 60/111 [00:40<00:35,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7838, UAS: 0.9304, LAS: 0.8762, UEM: 0.5293, LEM: 0.2987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1126, partial_loss/deprel_loss: 1.3161, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6297, loss: 0.8591, batch_reg_loss: 0.1543, reg_loss: 0.1538 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9300, LAS: 0.8758, UEM: 0.5307, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2438, partial_loss/deprel_loss: 0.3579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4894, loss: 0.8597, batch_reg_loss: 0.1543, reg_loss: 0.1538 ||:  60%|######    | 67/111 [00:45<00:30,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9313, LAS: 0.8773, UEM: 0.5548, LEM: 0.3303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0642, partial_loss/deprel_loss: 0.1699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3031, loss: 0.8491, batch_reg_loss: 0.1544, reg_loss: 0.1538 ||:  63%|######3   | 70/111 [00:47<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.9314, LAS: 0.8771, UEM: 0.5535, LEM: 0.3281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1907, partial_loss/deprel_loss: 1.0234, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2113, loss: 0.8511, batch_reg_loss: 0.1544, reg_loss: 0.1538 ||:  66%|######5   | 73/111 [00:50<00:28,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9308, LAS: 0.8763, UEM: 0.5414, LEM: 0.3172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5767, partial_loss/deprel_loss: 0.7398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8617, loss: 0.8574, batch_reg_loss: 0.1545, reg_loss: 0.1539 ||:  69%|######9   | 77/111 [00:52<00:24,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8864, UAS: 0.9307, LAS: 0.8762, UEM: 0.5364, LEM: 0.3123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4993, partial_loss/deprel_loss: 0.6346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7621, loss: 0.8571, batch_reg_loss: 0.1546, reg_loss: 0.1539 ||:  73%|#######2  | 81/111 [00:54<00:20,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9312, LAS: 0.8766, UEM: 0.5370, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4384, partial_loss/deprel_loss: 0.6207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7389, loss: 0.8523, batch_reg_loss: 0.1546, reg_loss: 0.1539 ||:  76%|#######5  | 84/111 [00:57<00:18,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9312, LAS: 0.8766, UEM: 0.5312, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7141, partial_loss/deprel_loss: 0.6809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8422, loss: 0.8526, batch_reg_loss: 0.1547, reg_loss: 0.1539 ||:  78%|#######8  | 87/111 [00:59<00:16,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9298, LAS: 0.8751, UEM: 0.5309, LEM: 0.3053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1345, partial_loss/deprel_loss: 0.9797, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1654, loss: 0.8649, batch_reg_loss: 0.1547, reg_loss: 0.1540 ||:  81%|########1 | 90/111 [01:01<00:14,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.9301, LAS: 0.8755, UEM: 0.5403, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5235, partial_loss/deprel_loss: 0.6702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7956, loss: 0.8621, batch_reg_loss: 0.1548, reg_loss: 0.1540 ||:  84%|########3 | 93/111 [01:03<00:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8038, UAS: 0.9290, LAS: 0.8744, UEM: 0.5343, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9209, partial_loss/deprel_loss: 1.1134, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4297, loss: 0.8719, batch_reg_loss: 0.1548, reg_loss: 0.1540 ||:  86%|########6 | 96/111 [01:05<00:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9294, LAS: 0.8747, UEM: 0.5321, LEM: 0.3085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3043, partial_loss/deprel_loss: 0.5841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6830, loss: 0.8683, batch_reg_loss: 0.1549, reg_loss: 0.1541 ||:  90%|######### | 100/111 [01:08<00:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8439, UAS: 0.9285, LAS: 0.8737, UEM: 0.5242, LEM: 0.3027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1519, partial_loss/deprel_loss: 0.9448, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1412, loss: 0.8762, batch_reg_loss: 0.1550, reg_loss: 0.1541 ||:  94%|#########3| 104/111 [01:10<00:04,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9284, LAS: 0.8734, UEM: 0.5209, LEM: 0.2983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3185, partial_loss/deprel_loss: 0.4996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6184, loss: 0.8786, batch_reg_loss: 0.1550, reg_loss: 0.1541 ||:  97%|#########7| 108/111 [01:13<00:01,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9289, LAS: 0.8740, UEM: 0.5235, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3537, partial_loss/deprel_loss: 0.4988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6249, loss: 0.8731, batch_reg_loss: 0.1551, reg_loss: 0.1542 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.499  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.354  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.154  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - UEM                      |     0.523  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - LAS                      |     0.874  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - loss                     |     0.873  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - LEM                      |     0.298  |       N/A\n",
+      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
+      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - EM                       |     0.896  |       N/A\n",
+      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:54:04,143 - INFO - combo.training.trainer - Epoch duration: 0:01:15.561956\n",
+      "2023-04-06 23:54:04,143 - INFO - combo.training.trainer - Estimated training time remaining: 7:40:27\n",
+      "2023-04-06 23:54:04,143 - INFO - allennlp.training.trainer - Epoch 49/399\n",
+      "2023-04-06 23:54:04,144 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:54:04,144 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:54:04,149 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7909, UAS: 0.8954, LAS: 0.8373, UEM: 0.3531, LEM: 0.2014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9718, partial_loss/deprel_loss: 1.1487, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4685, loss: 1.1159, batch_reg_loss: 0.1552, reg_loss: 0.1552 ||:   4%|3         | 4/111 [00:02<01:10,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9175, LAS: 0.8616, UEM: 0.4567, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3460, partial_loss/deprel_loss: 0.4872, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6142, loss: 0.9446, batch_reg_loss: 0.1553, reg_loss: 0.1552 ||:   7%|7         | 8/111 [00:05<01:06,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9264, LAS: 0.8697, UEM: 0.5122, LEM: 0.2647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3347, partial_loss/deprel_loss: 0.5663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6753, loss: 0.8896, batch_reg_loss: 0.1553, reg_loss: 0.1552 ||:  10%|9         | 11/111 [00:07<01:07,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8149, UAS: 0.9191, LAS: 0.8626, UEM: 0.4610, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7589, partial_loss/deprel_loss: 1.0592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3545, loss: 0.9608, batch_reg_loss: 0.1554, reg_loss: 0.1553 ||:  14%|#3        | 15/111 [00:09<01:02,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9214, LAS: 0.8657, UEM: 0.4965, LEM: 0.2659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1912, partial_loss/deprel_loss: 0.3556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4782, loss: 0.9304, batch_reg_loss: 0.1554, reg_loss: 0.1553 ||:  17%|#7        | 19/111 [00:12<00:58,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9223, LAS: 0.8664, UEM: 0.4895, LEM: 0.2537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3587, partial_loss/deprel_loss: 0.5543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6707, loss: 0.9235, batch_reg_loss: 0.1555, reg_loss: 0.1553 ||:  21%|##        | 23/111 [00:14<00:57,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9252, LAS: 0.8696, UEM: 0.4974, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2637, partial_loss/deprel_loss: 0.3971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5260, loss: 0.8980, batch_reg_loss: 0.1556, reg_loss: 0.1554 ||:  24%|##4       | 27/111 [00:17<00:54,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8481, UAS: 0.9248, LAS: 0.8688, UEM: 0.4822, LEM: 0.2448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9313, partial_loss/deprel_loss: 0.9207, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0785, loss: 0.9065, batch_reg_loss: 0.1556, reg_loss: 0.1554 ||:  27%|##7       | 30/111 [00:19<00:53,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9285, LAS: 0.8729, UEM: 0.5310, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3969, partial_loss/deprel_loss: 0.4874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6250, loss: 0.8737, batch_reg_loss: 0.1557, reg_loss: 0.1554 ||:  30%|##9       | 33/111 [00:22<00:55,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9296, LAS: 0.8746, UEM: 0.5256, LEM: 0.2821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6425, partial_loss/deprel_loss: 0.6280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 0.8591, batch_reg_loss: 0.1558, reg_loss: 0.1554 ||:  33%|###3      | 37/111 [00:24<00:50,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9294, LAS: 0.8742, UEM: 0.5161, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3167, partial_loss/deprel_loss: 0.4630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5896, loss: 0.8647, batch_reg_loss: 0.1558, reg_loss: 0.1555 ||:  37%|###6      | 41/111 [00:26<00:44,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9300, LAS: 0.8749, UEM: 0.5093, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6331, partial_loss/deprel_loss: 0.7067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8478, loss: 0.8596, batch_reg_loss: 0.1559, reg_loss: 0.1555 ||:  41%|####      | 45/111 [00:29<00:43,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9313, LAS: 0.8765, UEM: 0.5172, LEM: 0.2726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2331, partial_loss/deprel_loss: 0.4538, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5656, loss: 0.8482, batch_reg_loss: 0.1559, reg_loss: 0.1555 ||:  44%|####4     | 49/111 [00:31<00:39,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9308, LAS: 0.8760, UEM: 0.5255, LEM: 0.2803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3214, partial_loss/deprel_loss: 0.5428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6545, loss: 0.8538, batch_reg_loss: 0.1560, reg_loss: 0.1556 ||:  48%|####7     | 53/111 [00:34<00:39,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9295, LAS: 0.8748, UEM: 0.5237, LEM: 0.2787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4346, partial_loss/deprel_loss: 0.6295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7466, loss: 0.8677, batch_reg_loss: 0.1560, reg_loss: 0.1556 ||:  50%|#####     | 56/111 [00:37<00:38,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9301, LAS: 0.8753, UEM: 0.5200, LEM: 0.2719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5485, partial_loss/deprel_loss: 0.6739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8050, loss: 0.8635, batch_reg_loss: 0.1561, reg_loss: 0.1556 ||:  53%|#####3    | 59/111 [00:39<00:36,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9304, LAS: 0.8758, UEM: 0.5333, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1874, partial_loss/deprel_loss: 0.3743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4931, loss: 0.8582, batch_reg_loss: 0.1561, reg_loss: 0.1557 ||:  56%|#####5    | 62/111 [00:41<00:35,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9301, LAS: 0.8755, UEM: 0.5277, LEM: 0.2818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3650, partial_loss/deprel_loss: 0.5520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6708, loss: 0.8625, batch_reg_loss: 0.1562, reg_loss: 0.1557 ||:  59%|#####8    | 65/111 [00:43<00:32,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9311, LAS: 0.8764, UEM: 0.5335, LEM: 0.2839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5554, partial_loss/deprel_loss: 0.6621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7970, loss: 0.8548, batch_reg_loss: 0.1562, reg_loss: 0.1557 ||:  61%|######1   | 68/111 [00:46<00:32,  1.34it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9304, LAS: 0.8755, UEM: 0.5226, LEM: 0.2760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8234, partial_loss/deprel_loss: 0.7134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8917, loss: 0.8620, batch_reg_loss: 0.1563, reg_loss: 0.1557 ||:  65%|######4   | 72/111 [00:48<00:28,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8284, UAS: 0.9302, LAS: 0.8751, UEM: 0.5187, LEM: 0.2726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4144, partial_loss/deprel_loss: 1.0153, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2515, loss: 0.8652, batch_reg_loss: 0.1564, reg_loss: 0.1558 ||:  68%|######8   | 76/111 [00:51<00:24,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9312, LAS: 0.8763, UEM: 0.5408, LEM: 0.2998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4109, partial_loss/deprel_loss: 0.5739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6977, loss: 0.8563, batch_reg_loss: 0.1564, reg_loss: 0.1558 ||:  71%|#######1  | 79/111 [00:54<00:24,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9311, LAS: 0.8763, UEM: 0.5334, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5825, partial_loss/deprel_loss: 0.6902, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8251, loss: 0.8572, batch_reg_loss: 0.1565, reg_loss: 0.1558 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8287, UAS: 0.9302, LAS: 0.8752, UEM: 0.5287, LEM: 0.2902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3085, partial_loss/deprel_loss: 1.0597, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2660, loss: 0.8685, batch_reg_loss: 0.1565, reg_loss: 0.1558 ||:  78%|#######8  | 87/111 [00:58<00:16,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9299, LAS: 0.8749, UEM: 0.5339, LEM: 0.2979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1485, partial_loss/deprel_loss: 0.3128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4365, loss: 0.8724, batch_reg_loss: 0.1566, reg_loss: 0.1559 ||:  81%|########1 | 90/111 [01:01<00:14,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9307, LAS: 0.8758, UEM: 0.5454, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7527, partial_loss/deprel_loss: 0.7827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9333, loss: 0.8654, batch_reg_loss: 0.1566, reg_loss: 0.1559 ||:  84%|########3 | 93/111 [01:03<00:12,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9312, LAS: 0.8764, UEM: 0.5440, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8018, partial_loss/deprel_loss: 0.8328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9833, loss: 0.8617, batch_reg_loss: 0.1567, reg_loss: 0.1559 ||:  87%|########7 | 97/111 [01:05<00:09,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9300, LAS: 0.8753, UEM: 0.5369, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5177, partial_loss/deprel_loss: 0.6388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7714, loss: 0.8700, batch_reg_loss: 0.1568, reg_loss: 0.1560 ||:  91%|######### | 101/111 [01:07<00:06,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9295, LAS: 0.8746, UEM: 0.5288, LEM: 0.2978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8003, partial_loss/deprel_loss: 0.8681, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0114, loss: 0.8759, batch_reg_loss: 0.1568, reg_loss: 0.1560 ||:  95%|#########4| 105/111 [01:10<00:03,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9292, LAS: 0.8742, UEM: 0.5270, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8836, partial_loss/deprel_loss: 0.8153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9858, loss: 0.8781, batch_reg_loss: 0.1569, reg_loss: 0.1560 ||:  98%|#########8| 109/111 [01:12<00:01,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9294, LAS: 0.8745, UEM: 0.5276, LEM: 0.2970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2578, partial_loss/deprel_loss: 0.4366, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5578, loss: 0.8755, batch_reg_loss: 0.1569, reg_loss: 0.1560 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.437  |       N/A\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.258  |       N/A\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.156  |       N/A\n",
+      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - UEM                      |     0.528  |       N/A\n",
+      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - LAS                      |     0.874  |       N/A\n",
+      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - loss                     |     0.876  |       N/A\n",
+      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - LEM                      |     0.297  |       N/A\n",
+      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
+      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - EM                       |     0.914  |       N/A\n",
+      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:55:18,547 - INFO - combo.training.trainer - Epoch duration: 0:01:14.403031\n",
+      "2023-04-06 23:55:18,547 - INFO - combo.training.trainer - Estimated training time remaining: 7:38:38\n",
+      "2023-04-06 23:55:18,547 - INFO - allennlp.training.trainer - Epoch 50/399\n",
+      "2023-04-06 23:55:18,547 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:55:18,547 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:55:18,553 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8449, UAS: 0.9290, LAS: 0.8760, UEM: 0.5054, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1142, partial_loss/deprel_loss: 0.8807, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0844, loss: 0.8502, batch_reg_loss: 0.1570, reg_loss: 0.1570 ||:   3%|2         | 3/111 [00:02<01:19,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9221, LAS: 0.8702, UEM: 0.4812, LEM: 0.2827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2506, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5150, loss: 0.8912, batch_reg_loss: 0.1571, reg_loss: 0.1570 ||:   6%|6         | 7/111 [00:04<01:14,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9285, LAS: 0.8777, UEM: 0.5969, LEM: 0.3922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2795, partial_loss/deprel_loss: 0.4394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5646, loss: 0.8423, batch_reg_loss: 0.1571, reg_loss: 0.1570 ||:   9%|9         | 10/111 [00:07<01:17,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9283, LAS: 0.8774, UEM: 0.5628, LEM: 0.3540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5145, partial_loss/deprel_loss: 0.5950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7361, loss: 0.8468, batch_reg_loss: 0.1572, reg_loss: 0.1571 ||:  12%|#1        | 13/111 [00:09<01:12,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8716, UAS: 0.9320, LAS: 0.8807, UEM: 0.5504, LEM: 0.3256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7563, partial_loss/deprel_loss: 0.7074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8744, loss: 0.8170, batch_reg_loss: 0.1572, reg_loss: 0.1571 ||:  15%|#5        | 17/111 [00:12<01:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9309, LAS: 0.8794, UEM: 0.5287, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7209, partial_loss/deprel_loss: 0.7438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8965, loss: 0.8283, batch_reg_loss: 0.1573, reg_loss: 0.1571 ||:  18%|#8        | 20/111 [00:14<01:05,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8030, UAS: 0.9249, LAS: 0.8730, UEM: 0.4993, LEM: 0.2896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9332, partial_loss/deprel_loss: 1.1208, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4406, loss: 0.8825, batch_reg_loss: 0.1573, reg_loss: 0.1571 ||:  21%|##        | 23/111 [00:16<01:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9282, LAS: 0.8763, UEM: 0.5111, LEM: 0.2914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2713, partial_loss/deprel_loss: 0.4207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5482, loss: 0.8626, batch_reg_loss: 0.1574, reg_loss: 0.1572 ||:  24%|##4       | 27/111 [00:18<00:56,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9296, LAS: 0.8774, UEM: 0.5096, LEM: 0.2850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7129, partial_loss/deprel_loss: 0.7503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9003, loss: 0.8551, batch_reg_loss: 0.1574, reg_loss: 0.1572 ||:  27%|##7       | 30/111 [00:21<00:55,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9288, LAS: 0.8761, UEM: 0.5080, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2659, partial_loss/deprel_loss: 0.3883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5213, loss: 0.8652, batch_reg_loss: 0.1575, reg_loss: 0.1572 ||:  31%|###       | 34/111 [00:23<00:52,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9288, LAS: 0.8758, UEM: 0.5034, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5541, partial_loss/deprel_loss: 0.7148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8402, loss: 0.8701, batch_reg_loss: 0.1576, reg_loss: 0.1573 ||:  33%|###3      | 37/111 [00:25<00:50,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9306, LAS: 0.8774, UEM: 0.5220, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1300, partial_loss/deprel_loss: 0.3725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4816, loss: 0.8589, batch_reg_loss: 0.1576, reg_loss: 0.1573 ||:  36%|###6      | 40/111 [00:27<00:49,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8382, UAS: 0.9289, LAS: 0.8753, UEM: 0.5036, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1688, partial_loss/deprel_loss: 0.8952, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1076, loss: 0.8755, batch_reg_loss: 0.1577, reg_loss: 0.1573 ||:  40%|###9      | 44/111 [00:30<00:45,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9303, LAS: 0.8768, UEM: 0.5211, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5037, partial_loss/deprel_loss: 0.6167, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7518, loss: 0.8604, batch_reg_loss: 0.1577, reg_loss: 0.1573 ||:  42%|####2     | 47/111 [00:32<00:43,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.9302, LAS: 0.8764, UEM: 0.5122, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8860, partial_loss/deprel_loss: 0.8571, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0207, loss: 0.8628, batch_reg_loss: 0.1578, reg_loss: 0.1574 ||:  45%|####5     | 50/111 [00:34<00:41,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7913, UAS: 0.9295, LAS: 0.8755, UEM: 0.5144, LEM: 0.2883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9336, partial_loss/deprel_loss: 1.3001, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5847, loss: 0.8703, batch_reg_loss: 0.1578, reg_loss: 0.1574 ||:  48%|####7     | 53/111 [00:37<00:42,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9300, LAS: 0.8766, UEM: 0.5481, LEM: 0.3316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5420, partial_loss/deprel_loss: 1.0670, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3199, loss: 0.8646, batch_reg_loss: 0.1579, reg_loss: 0.1574 ||:  50%|#####     | 56/111 [00:39<00:40,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7832, UAS: 0.9297, LAS: 0.8761, UEM: 0.5495, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8045, partial_loss/deprel_loss: 1.2793, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5423, loss: 0.8670, batch_reg_loss: 0.1579, reg_loss: 0.1574 ||:  54%|#####4    | 60/111 [00:42<00:36,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9289, LAS: 0.8751, UEM: 0.5481, LEM: 0.3267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3008, partial_loss/deprel_loss: 0.5128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6284, loss: 0.8746, batch_reg_loss: 0.1580, reg_loss: 0.1575 ||:  57%|#####6    | 63/111 [00:44<00:34,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9290, LAS: 0.8750, UEM: 0.5390, LEM: 0.3177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3938, partial_loss/deprel_loss: 0.5525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6788, loss: 0.8767, batch_reg_loss: 0.1581, reg_loss: 0.1575 ||:  60%|######    | 67/111 [00:46<00:30,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9295, LAS: 0.8755, UEM: 0.5369, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3454, partial_loss/deprel_loss: 0.5430, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6616, loss: 0.8744, batch_reg_loss: 0.1581, reg_loss: 0.1575 ||:  64%|######3   | 71/111 [00:49<00:26,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8429, UAS: 0.9296, LAS: 0.8755, UEM: 0.5377, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0116, partial_loss/deprel_loss: 1.0316, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1858, loss: 0.8755, batch_reg_loss: 0.1582, reg_loss: 0.1576 ||:  67%|######6   | 74/111 [00:51<00:25,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.9294, LAS: 0.8754, UEM: 0.5309, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8416, partial_loss/deprel_loss: 0.7885, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9573, loss: 0.8776, batch_reg_loss: 0.1582, reg_loss: 0.1576 ||:  70%|#######   | 78/111 [00:53<00:21,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.9293, LAS: 0.8752, UEM: 0.5232, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9259, partial_loss/deprel_loss: 0.9234, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0822, loss: 0.8784, batch_reg_loss: 0.1583, reg_loss: 0.1576 ||:  74%|#######3  | 82/111 [00:55<00:18,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9294, LAS: 0.8752, UEM: 0.5207, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2829, partial_loss/deprel_loss: 0.4930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6093, loss: 0.8777, batch_reg_loss: 0.1583, reg_loss: 0.1577 ||:  77%|#######7  | 86/111 [00:58<00:15,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8559, UAS: 0.9291, LAS: 0.8750, UEM: 0.5146, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1339, partial_loss/deprel_loss: 0.9053, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1094, loss: 0.8806, batch_reg_loss: 0.1584, reg_loss: 0.1577 ||:  81%|########1 | 90/111 [01:01<00:13,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9299, LAS: 0.8757, UEM: 0.5307, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2277, partial_loss/deprel_loss: 0.4237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5429, loss: 0.8738, batch_reg_loss: 0.1585, reg_loss: 0.1577 ||:  85%|########4 | 94/111 [01:04<00:11,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9301, LAS: 0.8760, UEM: 0.5314, LEM: 0.3079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3976, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6621, loss: 0.8717, batch_reg_loss: 0.1585, reg_loss: 0.1578 ||:  87%|########7 | 97/111 [01:06<00:09,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8842, UAS: 0.9302, LAS: 0.8758, UEM: 0.5269, LEM: 0.3024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5324, partial_loss/deprel_loss: 0.6760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8058, loss: 0.8718, batch_reg_loss: 0.1586, reg_loss: 0.1578 ||:  91%|######### | 101/111 [01:08<00:06,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9307, LAS: 0.8763, UEM: 0.5341, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2046, partial_loss/deprel_loss: 0.4037, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5225, loss: 0.8681, batch_reg_loss: 0.1586, reg_loss: 0.1578 ||:  95%|#########4| 105/111 [01:11<00:04,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9308, LAS: 0.8765, UEM: 0.5314, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5598, partial_loss/deprel_loss: 0.6800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8146, loss: 0.8667, batch_reg_loss: 0.1587, reg_loss: 0.1578 ||:  97%|#########7| 108/111 [01:13<00:02,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9303, LAS: 0.8757, UEM: 0.5319, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.4364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5654, loss: 0.8721, batch_reg_loss: 0.1587, reg_loss: 0.1579 ||: 100%|##########| 111/111 [01:16<00:00,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9303, LAS: 0.8757, UEM: 0.5319, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.4364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5654, loss: 0.8721, batch_reg_loss: 0.1587, reg_loss: 0.1579 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
+      "2023-04-06 23:56:34,705 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9351, LAS: 0.8773, UEM: 0.4018, LEM: 0.1232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6037, partial_loss/deprel_loss: 24.7088, partial_loss/cycle_loss: 0.0000, batch_loss: 19.8878, loss: 28.6320, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9493, LAS: 0.8951, UEM: 0.6527, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 26.6414, partial_loss/cycle_loss: 0.0000, batch_loss: 21.3933, loss: 25.2934, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:07,  1.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9439, LAS: 0.8897, UEM: 0.5984, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2572, partial_loss/deprel_loss: 49.6530, partial_loss/cycle_loss: 0.0000, batch_loss: 39.9738, loss: 26.4770, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8273, UAS: 0.9402, LAS: 0.8860, UEM: 0.5746, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6577, partial_loss/deprel_loss: 58.9864, partial_loss/cycle_loss: 0.0000, batch_loss: 47.5206, loss: 27.0998, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:09<00:01,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9427, LAS: 0.8904, UEM: 0.6365, LEM: 0.3750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6548, partial_loss/deprel_loss: 35.0931, partial_loss/cycle_loss: 0.0000, batch_loss: 28.2055, loss: 26.3856, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00,  1.10it/s]\n",
+      "2023-04-06 23:56:46,535 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.436  |    35.093\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.288  |     0.655\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.158  |     0.000\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - UEM                      |     0.532  |     0.636\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - LAS                      |     0.876  |     0.890\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - loss                     |     0.872  |    26.386\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - LEM                      |     0.305  |     0.375\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |     0.943\n",
+      "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - EM                       |     0.911  |     0.885\n",
+      "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:56:46,537 - INFO - combo.training.trainer - Epoch duration: 0:01:27.990431\n",
+      "2023-04-06 23:56:46,537 - INFO - combo.training.trainer - Estimated training time remaining: 7:38:24\n",
+      "2023-04-06 23:56:46,537 - INFO - allennlp.training.trainer - Epoch 51/399\n",
+      "2023-04-06 23:56:46,537 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:56:46,538 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:56:46,543 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9240, LAS: 0.8692, UEM: 0.6476, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2921, partial_loss/deprel_loss: 0.4776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5993, loss: 0.9016, batch_reg_loss: 0.1588, reg_loss: 0.1587 ||:   3%|2         | 3/111 [00:02<01:13,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9277, LAS: 0.8749, UEM: 0.6799, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4705, partial_loss/deprel_loss: 0.5734, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7116, loss: 0.8611, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:   5%|5         | 6/111 [00:04<01:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9217, LAS: 0.8687, UEM: 0.6278, LEM: 0.3871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3600, partial_loss/deprel_loss: 0.4258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5715, loss: 0.9148, batch_reg_loss: 0.1589, reg_loss: 0.1588 ||:   9%|9         | 10/111 [00:06<01:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9316, LAS: 0.8807, UEM: 0.6713, LEM: 0.4400, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1199, partial_loss/deprel_loss: 0.2607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3915, loss: 0.8255, batch_reg_loss: 0.1589, reg_loss: 0.1588 ||:  13%|#2        | 14/111 [00:09<01:05,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8761, UAS: 0.9349, LAS: 0.8836, UEM: 0.6458, LEM: 0.4052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6169, partial_loss/deprel_loss: 0.6818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8278, loss: 0.8022, batch_reg_loss: 0.1590, reg_loss: 0.1589 ||:  16%|#6        | 18/111 [00:11<01:00,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.9336, LAS: 0.8810, UEM: 0.6118, LEM: 0.3778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8011, partial_loss/deprel_loss: 0.8718, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0168, loss: 0.8227, batch_reg_loss: 0.1591, reg_loss: 0.1589 ||:  20%|#9        | 22/111 [00:14<00:58,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9371, LAS: 0.8849, UEM: 0.6244, LEM: 0.3825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4766, partial_loss/deprel_loss: 0.6570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.7951, batch_reg_loss: 0.1591, reg_loss: 0.1589 ||:  23%|##3       | 26/111 [00:17<00:55,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9349, LAS: 0.8821, UEM: 0.5989, LEM: 0.3635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2324, partial_loss/deprel_loss: 1.1135, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2964, loss: 0.8195, batch_reg_loss: 0.1592, reg_loss: 0.1590 ||:  26%|##6       | 29/111 [00:19<00:55,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9340, LAS: 0.8813, UEM: 0.5833, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2795, partial_loss/deprel_loss: 0.4729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5935, loss: 0.8260, batch_reg_loss: 0.1592, reg_loss: 0.1590 ||:  30%|##9       | 33/111 [00:21<00:52,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9356, LAS: 0.8825, UEM: 0.5790, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3626, partial_loss/deprel_loss: 0.5307, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6563, loss: 0.8157, batch_reg_loss: 0.1593, reg_loss: 0.1590 ||:  33%|###3      | 37/111 [00:24<00:48,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9346, LAS: 0.8810, UEM: 0.5659, LEM: 0.3250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5879, partial_loss/deprel_loss: 0.6852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8250, loss: 0.8271, batch_reg_loss: 0.1593, reg_loss: 0.1590 ||:  37%|###6      | 41/111 [00:26<00:44,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9339, LAS: 0.8803, UEM: 0.5605, LEM: 0.3205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.8325, batch_reg_loss: 0.1594, reg_loss: 0.1591 ||:  41%|####      | 45/111 [00:29<00:43,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9337, LAS: 0.8795, UEM: 0.5521, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4302, partial_loss/deprel_loss: 0.6363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7545, loss: 0.8381, batch_reg_loss: 0.1595, reg_loss: 0.1591 ||:  44%|####4     | 49/111 [00:32<00:41,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9334, LAS: 0.8794, UEM: 0.5531, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3607, partial_loss/deprel_loss: 0.4791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6150, loss: 0.8376, batch_reg_loss: 0.1595, reg_loss: 0.1591 ||:  47%|####6     | 52/111 [00:34<00:40,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9332, LAS: 0.8791, UEM: 0.5510, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1740, partial_loss/deprel_loss: 1.0353, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2226, loss: 0.8416, batch_reg_loss: 0.1596, reg_loss: 0.1592 ||:  50%|####9     | 55/111 [00:36<00:38,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9325, LAS: 0.8786, UEM: 0.5527, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2625, partial_loss/deprel_loss: 0.4347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.8446, batch_reg_loss: 0.1596, reg_loss: 0.1592 ||:  53%|#####3    | 59/111 [00:39<00:36,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9332, LAS: 0.8796, UEM: 0.5727, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9880, partial_loss/deprel_loss: 0.8851, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0654, loss: 0.8385, batch_reg_loss: 0.1597, reg_loss: 0.1592 ||:  56%|#####5    | 62/111 [00:41<00:36,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9340, LAS: 0.8803, UEM: 0.5741, LEM: 0.3408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6115, partial_loss/deprel_loss: 0.6343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7895, loss: 0.8323, batch_reg_loss: 0.1598, reg_loss: 0.1592 ||:  59%|#####8    | 65/111 [00:43<00:33,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8495, UAS: 0.9338, LAS: 0.8803, UEM: 0.5767, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1369, partial_loss/deprel_loss: 0.9492, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1465, loss: 0.8330, batch_reg_loss: 0.1598, reg_loss: 0.1593 ||:  62%|######2   | 69/111 [00:46<00:28,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9338, LAS: 0.8799, UEM: 0.5702, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4896, partial_loss/deprel_loss: 0.6765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7990, loss: 0.8342, batch_reg_loss: 0.1599, reg_loss: 0.1593 ||:  66%|######5   | 73/111 [00:48<00:25,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9336, LAS: 0.8800, UEM: 0.5638, LEM: 0.3331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5143, partial_loss/deprel_loss: 0.6041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7461, loss: 0.8336, batch_reg_loss: 0.1599, reg_loss: 0.1593 ||:  69%|######9   | 77/111 [00:51<00:22,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9337, LAS: 0.8802, UEM: 0.5669, LEM: 0.3362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.4236, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5462, loss: 0.8323, batch_reg_loss: 0.1600, reg_loss: 0.1594 ||:  73%|#######2  | 81/111 [00:53<00:19,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9341, LAS: 0.8807, UEM: 0.5677, LEM: 0.3368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3866, partial_loss/deprel_loss: 0.5101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6455, loss: 0.8288, batch_reg_loss: 0.1601, reg_loss: 0.1594 ||:  77%|#######6  | 85/111 [00:56<00:17,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9332, LAS: 0.8796, UEM: 0.5588, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7277, partial_loss/deprel_loss: 0.6583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8323, loss: 0.8376, batch_reg_loss: 0.1601, reg_loss: 0.1594 ||:  80%|########  | 89/111 [00:58<00:13,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8426, UAS: 0.9322, LAS: 0.8785, UEM: 0.5490, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9825, partial_loss/deprel_loss: 0.9410, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1095, loss: 0.8454, batch_reg_loss: 0.1602, reg_loss: 0.1595 ||:  84%|########3 | 93/111 [01:01<00:11,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9322, LAS: 0.8783, UEM: 0.5471, LEM: 0.3206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1948, partial_loss/deprel_loss: 0.3857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5078, loss: 0.8462, batch_reg_loss: 0.1602, reg_loss: 0.1595 ||:  87%|########7 | 97/111 [01:03<00:08,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9324, LAS: 0.8783, UEM: 0.5435, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6677, partial_loss/deprel_loss: 0.8023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9356, loss: 0.8459, batch_reg_loss: 0.1603, reg_loss: 0.1595 ||:  91%|######### | 101/111 [01:06<00:06,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8043, UAS: 0.9309, LAS: 0.8766, UEM: 0.5376, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7838, partial_loss/deprel_loss: 1.3054, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5615, loss: 0.8610, batch_reg_loss: 0.1604, reg_loss: 0.1596 ||:  95%|#########4| 105/111 [01:09<00:03,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8459, UAS: 0.9305, LAS: 0.8760, UEM: 0.5314, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2171, partial_loss/deprel_loss: 1.0465, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2410, loss: 0.8685, batch_reg_loss: 0.1604, reg_loss: 0.1596 ||:  98%|#########8| 109/111 [01:11<00:01,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8590, UAS: 0.9298, LAS: 0.8752, UEM: 0.5275, LEM: 0.3028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0356, partial_loss/deprel_loss: 0.8129, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0179, loss: 0.8747, batch_reg_loss: 0.1605, reg_loss: 0.1596 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
+      "2023-04-06 23:57:59,081 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.813  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.036  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.160  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - UEM                      |     0.528  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - LAS                      |     0.875  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - loss                     |     0.875  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - LEM                      |     0.303  |       N/A\n",
+      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
+      "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - EM                       |     0.859  |       N/A\n",
+      "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:57:59,083 - INFO - combo.training.trainer - Epoch duration: 0:01:12.545910\n",
+      "2023-04-06 23:57:59,083 - INFO - combo.training.trainer - Estimated training time remaining: 7:36:23\n",
+      "2023-04-06 23:57:59,083 - INFO - allennlp.training.trainer - Epoch 52/399\n",
+      "2023-04-06 23:57:59,084 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:57:59,084 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:57:59,089 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9408, LAS: 0.8872, UEM: 0.4940, LEM: 0.2390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3542, partial_loss/deprel_loss: 0.5430, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6658, loss: 0.7606, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:   3%|2         | 3/111 [00:02<01:12,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9258, LAS: 0.8711, UEM: 0.3767, LEM: 0.1598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6446, partial_loss/deprel_loss: 0.7826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9156, loss: 0.9016, batch_reg_loss: 0.1606, reg_loss: 0.1605 ||:   6%|6         | 7/111 [00:04<01:08,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9247, LAS: 0.8681, UEM: 0.3929, LEM: 0.1730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3376, partial_loss/deprel_loss: 0.5194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6437, loss: 0.9226, batch_reg_loss: 0.1607, reg_loss: 0.1606 ||:  10%|9         | 11/111 [00:06<01:04,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9313, LAS: 0.8752, UEM: 0.4850, LEM: 0.2418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9508, partial_loss/deprel_loss: 0.9080, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0773, loss: 0.8719, batch_reg_loss: 0.1607, reg_loss: 0.1606 ||:  14%|#3        | 15/111 [00:09<01:01,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8230, UAS: 0.9278, LAS: 0.8711, UEM: 0.4450, LEM: 0.2155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4530, partial_loss/deprel_loss: 1.1169, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3450, loss: 0.9087, batch_reg_loss: 0.1608, reg_loss: 0.1607 ||:  17%|#7        | 19/111 [00:11<00:55,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9296, LAS: 0.8736, UEM: 0.4856, LEM: 0.2525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4127, partial_loss/deprel_loss: 0.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6275, loss: 0.8893, batch_reg_loss: 0.1609, reg_loss: 0.1607 ||:  21%|##        | 23/111 [00:13<00:53,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9339, LAS: 0.8787, UEM: 0.5379, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3198, partial_loss/deprel_loss: 0.4749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.8470, batch_reg_loss: 0.1610, reg_loss: 0.1607 ||:  24%|##4       | 27/111 [00:16<00:49,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8564, UAS: 0.9342, LAS: 0.8793, UEM: 0.5529, LEM: 0.3165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7539, partial_loss/deprel_loss: 0.8258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9725, loss: 0.8433, batch_reg_loss: 0.1610, reg_loss: 0.1608 ||:  28%|##7       | 31/111 [00:18<00:48,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9329, LAS: 0.8781, UEM: 0.5454, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3077, partial_loss/deprel_loss: 0.5190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6378, loss: 0.8515, batch_reg_loss: 0.1611, reg_loss: 0.1608 ||:  32%|###1      | 35/111 [00:21<00:46,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9309, LAS: 0.8760, UEM: 0.5404, LEM: 0.3105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7887, partial_loss/deprel_loss: 0.8330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9853, loss: 0.8660, batch_reg_loss: 0.1611, reg_loss: 0.1608 ||:  35%|###5      | 39/111 [00:23<00:43,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9303, LAS: 0.8754, UEM: 0.5276, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9182, partial_loss/deprel_loss: 0.8559, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0296, loss: 0.8703, batch_reg_loss: 0.1612, reg_loss: 0.1609 ||:  39%|###8      | 43/111 [00:26<00:43,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9305, LAS: 0.8753, UEM: 0.5139, LEM: 0.2856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4979, partial_loss/deprel_loss: 0.6616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7901, loss: 0.8702, batch_reg_loss: 0.1613, reg_loss: 0.1609 ||:  42%|####2     | 47/111 [00:29<00:41,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9313, LAS: 0.8764, UEM: 0.5228, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3390, partial_loss/deprel_loss: 0.5202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6453, loss: 0.8633, batch_reg_loss: 0.1613, reg_loss: 0.1609 ||:  46%|####5     | 51/111 [00:32<00:40,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9325, LAS: 0.8777, UEM: 0.5325, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3731, partial_loss/deprel_loss: 0.5001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6361, loss: 0.8511, batch_reg_loss: 0.1614, reg_loss: 0.1610 ||:  49%|####8     | 54/111 [00:34<00:42,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8530, UAS: 0.9318, LAS: 0.8771, UEM: 0.5251, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0108, partial_loss/deprel_loss: 0.8002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0038, loss: 0.8569, batch_reg_loss: 0.1614, reg_loss: 0.1610 ||:  51%|#####1    | 57/111 [00:37<00:39,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9325, LAS: 0.8778, UEM: 0.5387, LEM: 0.3007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9719, partial_loss/deprel_loss: 0.9103, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0841, loss: 0.8512, batch_reg_loss: 0.1615, reg_loss: 0.1610 ||:  54%|#####4    | 60/111 [00:39<00:36,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9320, LAS: 0.8774, UEM: 0.5422, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4026, partial_loss/deprel_loss: 0.5979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7204, loss: 0.8555, batch_reg_loss: 0.1615, reg_loss: 0.1610 ||:  57%|#####6    | 63/111 [00:41<00:34,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7904, UAS: 0.9314, LAS: 0.8768, UEM: 0.5508, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7467, partial_loss/deprel_loss: 1.1340, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4181, loss: 0.8571, batch_reg_loss: 0.1616, reg_loss: 0.1611 ||:  59%|#####9    | 66/111 [00:43<00:32,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9300, LAS: 0.8752, UEM: 0.5399, LEM: 0.3040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6887, partial_loss/deprel_loss: 0.7504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8997, loss: 0.8692, batch_reg_loss: 0.1616, reg_loss: 0.1611 ||:  63%|######3   | 70/111 [00:45<00:27,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7555, UAS: 0.9286, LAS: 0.8739, UEM: 0.5343, LEM: 0.3004, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7179, partial_loss/deprel_loss: 1.4741, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8845, loss: 0.8808, batch_reg_loss: 0.1617, reg_loss: 0.1611 ||:  66%|######5   | 73/111 [00:47<00:26,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9288, LAS: 0.8740, UEM: 0.5333, LEM: 0.2995, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5149, partial_loss/deprel_loss: 0.6655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7971, loss: 0.8786, batch_reg_loss: 0.1617, reg_loss: 0.1611 ||:  69%|######9   | 77/111 [00:50<00:22,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8485, UAS: 0.9295, LAS: 0.8748, UEM: 0.5507, LEM: 0.3237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9174, partial_loss/deprel_loss: 0.9188, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0803, loss: 0.8734, batch_reg_loss: 0.1618, reg_loss: 0.1612 ||:  72%|#######2  | 80/111 [00:52<00:22,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9300, LAS: 0.8753, UEM: 0.5510, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5307, partial_loss/deprel_loss: 0.6004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7483, loss: 0.8682, batch_reg_loss: 0.1619, reg_loss: 0.1612 ||:  75%|#######4  | 83/111 [00:54<00:19,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9305, LAS: 0.8758, UEM: 0.5480, LEM: 0.3195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8368, partial_loss/deprel_loss: 0.9219, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0668, loss: 0.8654, batch_reg_loss: 0.1619, reg_loss: 0.1612 ||:  78%|#######8  | 87/111 [00:57<00:15,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8374, UAS: 0.9295, LAS: 0.8745, UEM: 0.5390, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1307, partial_loss/deprel_loss: 0.9379, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1385, loss: 0.8737, batch_reg_loss: 0.1620, reg_loss: 0.1613 ||:  82%|########1 | 91/111 [00:59<00:12,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9304, LAS: 0.8754, UEM: 0.5423, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5534, partial_loss/deprel_loss: 0.6744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8123, loss: 0.8675, batch_reg_loss: 0.1620, reg_loss: 0.1613 ||:  86%|########5 | 95/111 [01:01<00:10,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9307, LAS: 0.8758, UEM: 0.5385, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4924, partial_loss/deprel_loss: 0.6291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7639, loss: 0.8670, batch_reg_loss: 0.1621, reg_loss: 0.1613 ||:  89%|########9 | 99/111 [01:04<00:07,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9301, LAS: 0.8751, UEM: 0.5371, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8170, partial_loss/deprel_loss: 0.7834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9523, loss: 0.8710, batch_reg_loss: 0.1622, reg_loss: 0.1613 ||:  93%|#########2| 103/111 [01:07<00:05,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8459, UAS: 0.9301, LAS: 0.8751, UEM: 0.5326, LEM: 0.3018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2890, partial_loss/deprel_loss: 0.9941, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2153, loss: 0.8726, batch_reg_loss: 0.1622, reg_loss: 0.1614 ||:  96%|#########6| 107/111 [01:09<00:02,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9304, LAS: 0.8754, UEM: 0.5313, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4115, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7065, loss: 0.8711, batch_reg_loss: 0.1623, reg_loss: 0.1614 ||: 100%|##########| 111/111 [01:12<00:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9304, LAS: 0.8754, UEM: 0.5313, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4115, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7065, loss: 0.8711, batch_reg_loss: 0.1623, reg_loss: 0.1614 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
+      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.577  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.412  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.161  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - UEM                      |     0.531  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - LAS                      |     0.875  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - loss                     |     0.871  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - LEM                      |     0.299  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - EM                       |     0.903  |       N/A\n",
+      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-06 23:59:11,776 - INFO - combo.training.trainer - Epoch duration: 0:01:12.692473\n",
+      "2023-04-06 23:59:11,776 - INFO - combo.training.trainer - Estimated training time remaining: 7:34:25\n",
+      "2023-04-06 23:59:11,776 - INFO - allennlp.training.trainer - Epoch 53/399\n",
+      "2023-04-06 23:59:11,776 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-06 23:59:11,776 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-06 23:59:11,782 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9467, LAS: 0.8928, UEM: 0.5404, LEM: 0.2362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5696, partial_loss/deprel_loss: 0.5960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7530, loss: 0.7637, batch_reg_loss: 0.1623, reg_loss: 0.1623 ||:   3%|2         | 3/111 [00:02<01:12,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9464, LAS: 0.8947, UEM: 0.5560, LEM: 0.2780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5968, partial_loss/deprel_loss: 0.5837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7487, loss: 0.7131, batch_reg_loss: 0.1624, reg_loss: 0.1623 ||:   6%|6         | 7/111 [00:04<01:08,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9365, LAS: 0.8817, UEM: 0.4906, LEM: 0.2320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8449, partial_loss/deprel_loss: 0.7423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9252, loss: 0.8082, batch_reg_loss: 0.1625, reg_loss: 0.1624 ||:  10%|9         | 11/111 [00:07<01:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9394, LAS: 0.8855, UEM: 0.5849, LEM: 0.3407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2795, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5627, loss: 0.7742, batch_reg_loss: 0.1625, reg_loss: 0.1624 ||:  13%|#2        | 14/111 [00:09<01:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9397, LAS: 0.8861, UEM: 0.5769, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3935, partial_loss/deprel_loss: 0.5610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6901, loss: 0.7727, batch_reg_loss: 0.1625, reg_loss: 0.1624 ||:  15%|#5        | 17/111 [00:11<01:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8868, UAS: 0.9409, LAS: 0.8868, UEM: 0.5687, LEM: 0.3085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5827, partial_loss/deprel_loss: 0.6183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7738, loss: 0.7743, batch_reg_loss: 0.1626, reg_loss: 0.1624 ||:  19%|#8        | 21/111 [00:13<00:57,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8515, UAS: 0.9382, LAS: 0.8830, UEM: 0.5330, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7980, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9719, loss: 0.8025, batch_reg_loss: 0.1626, reg_loss: 0.1625 ||:  23%|##2       | 25/111 [00:16<00:54,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9323, LAS: 0.8767, UEM: 0.5110, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0175, partial_loss/deprel_loss: 0.8682, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0608, loss: 0.8586, batch_reg_loss: 0.1627, reg_loss: 0.1625 ||:  25%|##5       | 28/111 [00:18<00:54,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.9278, LAS: 0.8720, UEM: 0.4900, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1837, partial_loss/deprel_loss: 0.8709, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0962, loss: 0.8946, batch_reg_loss: 0.1627, reg_loss: 0.1625 ||:  28%|##7       | 31/111 [00:20<00:53,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9276, LAS: 0.8718, UEM: 0.4794, LEM: 0.2489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4080, partial_loss/deprel_loss: 0.4971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6420, loss: 0.8936, batch_reg_loss: 0.1628, reg_loss: 0.1625 ||:  31%|###       | 34/111 [00:22<00:52,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9292, LAS: 0.8736, UEM: 0.4858, LEM: 0.2491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4041, partial_loss/deprel_loss: 0.5663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6967, loss: 0.8827, batch_reg_loss: 0.1628, reg_loss: 0.1626 ||:  34%|###4      | 38/111 [00:25<00:48,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9295, LAS: 0.8742, UEM: 0.4897, LEM: 0.2530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4659, partial_loss/deprel_loss: 0.6584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7828, loss: 0.8813, batch_reg_loss: 0.1629, reg_loss: 0.1626 ||:  38%|###7      | 42/111 [00:27<00:44,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9311, LAS: 0.8761, UEM: 0.5027, LEM: 0.2619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1957, partial_loss/deprel_loss: 0.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5010, loss: 0.8652, batch_reg_loss: 0.1630, reg_loss: 0.1626 ||:  41%|####1     | 46/111 [00:30<00:42,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9320, LAS: 0.8773, UEM: 0.5124, LEM: 0.2717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5651, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7444, loss: 0.8546, batch_reg_loss: 0.1630, reg_loss: 0.1627 ||:  45%|####5     | 50/111 [00:33<00:41,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8246, UAS: 0.9308, LAS: 0.8758, UEM: 0.5093, LEM: 0.2702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1829, partial_loss/deprel_loss: 0.9669, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1732, loss: 0.8625, batch_reg_loss: 0.1631, reg_loss: 0.1627 ||:  48%|####7     | 53/111 [00:35<00:40,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8019, UAS: 0.9278, LAS: 0.8724, UEM: 0.4995, LEM: 0.2647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7117, partial_loss/deprel_loss: 1.1906, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4580, loss: 0.8887, batch_reg_loss: 0.1631, reg_loss: 0.1627 ||:  51%|#####1    | 57/111 [00:37<00:35,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9276, LAS: 0.8723, UEM: 0.4999, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5744, partial_loss/deprel_loss: 1.0889, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3492, loss: 0.8901, batch_reg_loss: 0.1632, reg_loss: 0.1627 ||:  55%|#####4    | 61/111 [00:39<00:31,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8730, UAS: 0.9285, LAS: 0.8731, UEM: 0.5093, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6473, partial_loss/deprel_loss: 0.7667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9061, loss: 0.8856, batch_reg_loss: 0.1633, reg_loss: 0.1628 ||:  59%|#####8    | 65/111 [00:42<00:29,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9278, LAS: 0.8724, UEM: 0.5045, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4895, partial_loss/deprel_loss: 0.5364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6903, loss: 0.8913, batch_reg_loss: 0.1633, reg_loss: 0.1628 ||:  62%|######2   | 69/111 [00:45<00:27,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8434, UAS: 0.9266, LAS: 0.8711, UEM: 0.4930, LEM: 0.2620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0492, partial_loss/deprel_loss: 1.0301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1973, loss: 0.9030, batch_reg_loss: 0.1634, reg_loss: 0.1628 ||:  66%|######5   | 73/111 [00:47<00:24,  1.57it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9267, LAS: 0.8713, UEM: 0.4968, LEM: 0.2664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3645, partial_loss/deprel_loss: 0.5718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6938, loss: 0.9019, batch_reg_loss: 0.1635, reg_loss: 0.1629 ||:  69%|######9   | 77/111 [00:50<00:22,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9279, LAS: 0.8725, UEM: 0.5080, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4258, partial_loss/deprel_loss: 0.5856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7172, loss: 0.8911, batch_reg_loss: 0.1636, reg_loss: 0.1629 ||:  73%|#######2  | 81/111 [00:53<00:21,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9288, LAS: 0.8735, UEM: 0.5127, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4960, partial_loss/deprel_loss: 0.7325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8488, loss: 0.8845, batch_reg_loss: 0.1636, reg_loss: 0.1629 ||:  76%|#######5  | 84/111 [00:55<00:19,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9295, LAS: 0.8742, UEM: 0.5182, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6469, partial_loss/deprel_loss: 0.6858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8417, loss: 0.8779, batch_reg_loss: 0.1637, reg_loss: 0.1630 ||:  78%|#######8  | 87/111 [00:58<00:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9290, LAS: 0.8735, UEM: 0.5111, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9573, partial_loss/deprel_loss: 0.9826, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1413, loss: 0.8841, batch_reg_loss: 0.1637, reg_loss: 0.1630 ||:  81%|########1 | 90/111 [01:00<00:14,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9303, LAS: 0.8751, UEM: 0.5402, LEM: 0.3059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2008, partial_loss/deprel_loss: 0.3759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5046, loss: 0.8728, batch_reg_loss: 0.1637, reg_loss: 0.1630 ||:  84%|########3 | 93/111 [01:02<00:13,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8101, UAS: 0.9297, LAS: 0.8744, UEM: 0.5358, LEM: 0.3025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3972, partial_loss/deprel_loss: 1.1130, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3336, loss: 0.8781, batch_reg_loss: 0.1638, reg_loss: 0.1630 ||:  87%|########7 | 97/111 [01:04<00:09,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.9295, LAS: 0.8743, UEM: 0.5347, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3269, partial_loss/deprel_loss: 1.0957, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3058, loss: 0.8800, batch_reg_loss: 0.1638, reg_loss: 0.1631 ||:  90%|######### | 100/111 [01:07<00:07,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9296, LAS: 0.8744, UEM: 0.5320, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3737, partial_loss/deprel_loss: 0.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6197, loss: 0.8794, batch_reg_loss: 0.1639, reg_loss: 0.1631 ||:  94%|#########3| 104/111 [01:09<00:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9301, LAS: 0.8749, UEM: 0.5330, LEM: 0.2968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9118, partial_loss/deprel_loss: 0.9566, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1116, loss: 0.8764, batch_reg_loss: 0.1639, reg_loss: 0.1631 ||:  97%|#########7| 108/111 [01:12<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8401, UAS: 0.9299, LAS: 0.8747, UEM: 0.5328, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0703, partial_loss/deprel_loss: 0.9871, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1677, loss: 0.8771, batch_reg_loss: 0.1640, reg_loss: 0.1631 ||: 100%|##########| 111/111 [01:14<00:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8401, UAS: 0.9299, LAS: 0.8747, UEM: 0.5328, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0703, partial_loss/deprel_loss: 0.9871, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1677, loss: 0.8771, batch_reg_loss: 0.1640, reg_loss: 0.1631 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
+      "2023-04-07 00:00:26,510 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.987  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.070  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.163  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - UEM                      |     0.533  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - LAS                      |     0.875  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - loss                     |     0.877  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - LEM                      |     0.298  |       N/A\n",
+      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
+      "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - EM                       |     0.840  |       N/A\n",
+      "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:00:26,512 - INFO - combo.training.trainer - Epoch duration: 0:01:14.736354\n",
+      "2023-04-07 00:00:26,513 - INFO - combo.training.trainer - Estimated training time remaining: 7:32:42\n",
+      "2023-04-07 00:00:26,513 - INFO - allennlp.training.trainer - Epoch 54/399\n",
+      "2023-04-07 00:00:26,513 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:00:26,513 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:00:26,520 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9448, LAS: 0.8931, UEM: 0.7116, LEM: 0.4577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2033, partial_loss/deprel_loss: 0.3485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4835, loss: 0.7435, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:   3%|2         | 3/111 [00:02<01:14,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9409, LAS: 0.8887, UEM: 0.5927, LEM: 0.3441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3385, partial_loss/deprel_loss: 0.4904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6241, loss: 0.7844, batch_reg_loss: 0.1641, reg_loss: 0.1640 ||:   6%|6         | 7/111 [00:04<01:10,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.9355, LAS: 0.8830, UEM: 0.5229, LEM: 0.2916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8470, partial_loss/deprel_loss: 0.8782, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0361, loss: 0.8226, batch_reg_loss: 0.1641, reg_loss: 0.1641 ||:  10%|9         | 11/111 [00:06<01:05,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9305, LAS: 0.8779, UEM: 0.5623, LEM: 0.3476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1667, partial_loss/deprel_loss: 0.3135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4483, loss: 0.8639, batch_reg_loss: 0.1642, reg_loss: 0.1641 ||:  13%|#2        | 14/111 [00:09<01:07,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8417, UAS: 0.9307, LAS: 0.8791, UEM: 0.6237, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1766, partial_loss/deprel_loss: 0.9353, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1478, loss: 0.8571, batch_reg_loss: 0.1642, reg_loss: 0.1641 ||:  15%|#5        | 17/111 [00:13<01:29,  1.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9324, LAS: 0.8798, UEM: 0.5994, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4481, partial_loss/deprel_loss: 0.6010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.8410, batch_reg_loss: 0.1643, reg_loss: 0.1641 ||:  19%|#8        | 21/111 [00:16<01:18,  1.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9320, LAS: 0.8789, UEM: 0.5892, LEM: 0.3873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2499, partial_loss/deprel_loss: 0.4475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5723, loss: 0.8520, batch_reg_loss: 0.1643, reg_loss: 0.1642 ||:  22%|##1       | 24/111 [00:19<01:13,  1.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8887, UAS: 0.9321, LAS: 0.8784, UEM: 0.5624, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5136, partial_loss/deprel_loss: 0.6196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7628, loss: 0.8548, batch_reg_loss: 0.1644, reg_loss: 0.1642 ||:  25%|##5       | 28/111 [00:21<01:04,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9341, LAS: 0.8809, UEM: 0.5804, LEM: 0.3688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2605, partial_loss/deprel_loss: 0.3954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5329, loss: 0.8333, batch_reg_loss: 0.1644, reg_loss: 0.1642 ||:  28%|##7       | 31/111 [00:23<01:02,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9328, LAS: 0.8791, UEM: 0.5736, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2956, partial_loss/deprel_loss: 0.4525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5856, loss: 0.8460, batch_reg_loss: 0.1645, reg_loss: 0.1642 ||:  31%|###       | 34/111 [00:26<00:59,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9333, LAS: 0.8795, UEM: 0.5669, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4214, partial_loss/deprel_loss: 0.5140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6600, loss: 0.8440, batch_reg_loss: 0.1645, reg_loss: 0.1643 ||:  33%|###3      | 37/111 [00:28<00:55,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9334, LAS: 0.8801, UEM: 0.5717, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3333, partial_loss/deprel_loss: 0.9017, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1526, loss: 0.8380, batch_reg_loss: 0.1646, reg_loss: 0.1643 ||:  36%|###6      | 40/111 [00:30<00:53,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9321, LAS: 0.8783, UEM: 0.5681, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1812, partial_loss/deprel_loss: 0.8796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1046, loss: 0.8479, batch_reg_loss: 0.1646, reg_loss: 0.1643 ||:  39%|###8      | 43/111 [00:32<00:50,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9331, LAS: 0.8794, UEM: 0.5662, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8001, partial_loss/deprel_loss: 0.7264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9059, loss: 0.8421, batch_reg_loss: 0.1647, reg_loss: 0.1643 ||:  42%|####2     | 47/111 [00:35<00:45,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9321, LAS: 0.8786, UEM: 0.5562, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3762, partial_loss/deprel_loss: 0.5160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6528, loss: 0.8515, batch_reg_loss: 0.1647, reg_loss: 0.1644 ||:  46%|####5     | 51/111 [00:37<00:40,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9321, LAS: 0.8786, UEM: 0.5521, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2895, partial_loss/deprel_loss: 0.4472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5805, loss: 0.8509, batch_reg_loss: 0.1648, reg_loss: 0.1644 ||:  49%|####8     | 54/111 [00:39<00:39,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9332, LAS: 0.8799, UEM: 0.5667, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4449, partial_loss/deprel_loss: 0.6679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7881, loss: 0.8421, batch_reg_loss: 0.1648, reg_loss: 0.1644 ||:  51%|#####1    | 57/111 [00:41<00:37,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7900, UAS: 0.9308, LAS: 0.8773, UEM: 0.5544, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8413, partial_loss/deprel_loss: 1.2192, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5085, loss: 0.8640, batch_reg_loss: 0.1649, reg_loss: 0.1644 ||:  55%|#####4    | 61/111 [00:44<00:33,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9321, LAS: 0.8786, UEM: 0.5625, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1444, partial_loss/deprel_loss: 0.3851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5019, loss: 0.8516, batch_reg_loss: 0.1649, reg_loss: 0.1645 ||:  59%|#####8    | 65/111 [00:47<00:31,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9318, LAS: 0.8784, UEM: 0.5630, LEM: 0.3356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4898, partial_loss/deprel_loss: 0.6133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7536, loss: 0.8540, batch_reg_loss: 0.1650, reg_loss: 0.1645 ||:  62%|######2   | 69/111 [00:49<00:28,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9320, LAS: 0.8785, UEM: 0.5594, LEM: 0.3298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3849, partial_loss/deprel_loss: 0.5626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6921, loss: 0.8529, batch_reg_loss: 0.1651, reg_loss: 0.1645 ||:  65%|######4   | 72/111 [00:52<00:26,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8562, UAS: 0.9308, LAS: 0.8771, UEM: 0.5510, LEM: 0.3240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0675, partial_loss/deprel_loss: 0.8571, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0643, loss: 0.8638, batch_reg_loss: 0.1651, reg_loss: 0.1645 ||:  68%|######7   | 75/111 [00:54<00:24,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8299, UAS: 0.9300, LAS: 0.8759, UEM: 0.5432, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3399, partial_loss/deprel_loss: 0.9877, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2233, loss: 0.8729, batch_reg_loss: 0.1652, reg_loss: 0.1646 ||:  70%|#######   | 78/111 [00:56<00:22,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9305, LAS: 0.8765, UEM: 0.5447, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6205, partial_loss/deprel_loss: 0.7112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8583, loss: 0.8691, batch_reg_loss: 0.1652, reg_loss: 0.1646 ||:  73%|#######2  | 81/111 [00:58<00:21,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9294, LAS: 0.8752, UEM: 0.5381, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5750, partial_loss/deprel_loss: 0.6413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7933, loss: 0.8801, batch_reg_loss: 0.1653, reg_loss: 0.1646 ||:  77%|#######6  | 85/111 [01:00<00:17,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9299, LAS: 0.8759, UEM: 0.5388, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5388, partial_loss/deprel_loss: 0.6564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7982, loss: 0.8754, batch_reg_loss: 0.1653, reg_loss: 0.1646 ||:  79%|#######9  | 88/111 [01:02<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9307, LAS: 0.8765, UEM: 0.5455, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2060, partial_loss/deprel_loss: 0.3806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5111, loss: 0.8701, batch_reg_loss: 0.1654, reg_loss: 0.1647 ||:  83%|########2 | 92/111 [01:05<00:12,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8516, UAS: 0.9298, LAS: 0.8756, UEM: 0.5412, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0076, partial_loss/deprel_loss: 0.9710, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1438, loss: 0.8782, batch_reg_loss: 0.1655, reg_loss: 0.1647 ||:  86%|########6 | 96/111 [01:08<00:10,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8668, UAS: 0.9303, LAS: 0.8761, UEM: 0.5436, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7639, partial_loss/deprel_loss: 0.8132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9688, loss: 0.8738, batch_reg_loss: 0.1655, reg_loss: 0.1647 ||:  89%|########9 | 99/111 [01:10<00:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8463, UAS: 0.9296, LAS: 0.8754, UEM: 0.5380, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1287, partial_loss/deprel_loss: 0.9364, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1404, loss: 0.8794, batch_reg_loss: 0.1656, reg_loss: 0.1648 ||:  92%|#########1| 102/111 [01:12<00:06,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9302, LAS: 0.8761, UEM: 0.5385, LEM: 0.3065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2722, partial_loss/deprel_loss: 0.4483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5787, loss: 0.8726, batch_reg_loss: 0.1656, reg_loss: 0.1648 ||:  95%|#########5| 106/111 [01:14<00:03,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9303, LAS: 0.8761, UEM: 0.5354, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8501, partial_loss/deprel_loss: 0.8843, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0431, loss: 0.8737, batch_reg_loss: 0.1657, reg_loss: 0.1648 ||:  99%|#########9| 110/111 [01:17<00:00,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9302, LAS: 0.8760, UEM: 0.5334, LEM: 0.3015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7965, partial_loss/deprel_loss: 0.7209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9017, loss: 0.8739, batch_reg_loss: 0.1657, reg_loss: 0.1648 ||: 100%|##########| 111/111 [01:17<00:00,  1.42it/s]\n",
+      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.721  |       N/A\n",
+      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.797  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.165  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - UEM                      |     0.533  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - LAS                      |     0.876  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - loss                     |     0.874  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - LEM                      |     0.302  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - EM                       |     0.865  |       N/A\n",
+      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:01:44,506 - INFO - combo.training.trainer - Epoch duration: 0:01:17.993194\n",
+      "2023-04-07 00:01:44,506 - INFO - combo.training.trainer - Estimated training time remaining: 7:31:20\n",
+      "2023-04-07 00:01:44,506 - INFO - allennlp.training.trainer - Epoch 55/399\n",
+      "2023-04-07 00:01:44,506 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:01:44,507 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:01:44,513 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9378, LAS: 0.8843, UEM: 0.6189, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3601, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6997, loss: 0.7860, batch_reg_loss: 0.1657, reg_loss: 0.1657 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8378, UAS: 0.9324, LAS: 0.8764, UEM: 0.4882, LEM: 0.2407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0905, partial_loss/deprel_loss: 1.0808, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2485, loss: 0.8774, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:   6%|6         | 7/111 [00:04<01:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8522, UAS: 0.9306, LAS: 0.8749, UEM: 0.4708, LEM: 0.2315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0105, partial_loss/deprel_loss: 0.8525, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0499, loss: 0.8856, batch_reg_loss: 0.1659, reg_loss: 0.1658 ||:  10%|9         | 11/111 [00:07<01:06,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9339, LAS: 0.8782, UEM: 0.5102, LEM: 0.2496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2956, partial_loss/deprel_loss: 0.4273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5669, loss: 0.8600, batch_reg_loss: 0.1659, reg_loss: 0.1658 ||:  14%|#3        | 15/111 [00:09<01:01,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8532, UAS: 0.9279, LAS: 0.8717, UEM: 0.4778, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0383, partial_loss/deprel_loss: 0.8635, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0645, loss: 0.9098, batch_reg_loss: 0.1660, reg_loss: 0.1659 ||:  17%|#7        | 19/111 [00:11<00:58,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8922, UAS: 0.9278, LAS: 0.8715, UEM: 0.4733, LEM: 0.2227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3426, partial_loss/deprel_loss: 0.5423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6684, loss: 0.9059, batch_reg_loss: 0.1661, reg_loss: 0.1659 ||:  21%|##        | 23/111 [00:14<00:55,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9272, LAS: 0.8709, UEM: 0.4712, LEM: 0.2228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2936, partial_loss/deprel_loss: 0.4856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6133, loss: 0.9143, batch_reg_loss: 0.1661, reg_loss: 0.1659 ||:  23%|##3       | 26/111 [00:16<00:55,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9271, LAS: 0.8711, UEM: 0.4586, LEM: 0.2171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7521, partial_loss/deprel_loss: 0.7589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9237, loss: 0.9126, batch_reg_loss: 0.1662, reg_loss: 0.1659 ||:  26%|##6       | 29/111 [00:18<00:57,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9291, LAS: 0.8736, UEM: 0.4894, LEM: 0.2468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4697, partial_loss/deprel_loss: 0.6005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7406, loss: 0.8919, batch_reg_loss: 0.1662, reg_loss: 0.1660 ||:  29%|##8       | 32/111 [00:21<00:57,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9282, LAS: 0.8727, UEM: 0.5098, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1440, partial_loss/deprel_loss: 0.3799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4990, loss: 0.8966, batch_reg_loss: 0.1663, reg_loss: 0.1660 ||:  32%|###2      | 36/111 [00:24<00:54,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9284, LAS: 0.8732, UEM: 0.5109, LEM: 0.2716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2249, partial_loss/deprel_loss: 0.3740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5105, loss: 0.8943, batch_reg_loss: 0.1664, reg_loss: 0.1660 ||:  36%|###6      | 40/111 [00:26<00:50,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9290, LAS: 0.8739, UEM: 0.5005, LEM: 0.2620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5359, partial_loss/deprel_loss: 0.5986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7525, loss: 0.8865, batch_reg_loss: 0.1664, reg_loss: 0.1661 ||:  40%|###9      | 44/111 [00:29<00:44,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8538, UAS: 0.9300, LAS: 0.8750, UEM: 0.5045, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0223, partial_loss/deprel_loss: 0.9283, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1136, loss: 0.8820, batch_reg_loss: 0.1665, reg_loss: 0.1661 ||:  43%|####3     | 48/111 [00:31<00:41,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9303, LAS: 0.8755, UEM: 0.5021, LEM: 0.2655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7655, partial_loss/deprel_loss: 0.7056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8842, loss: 0.8792, batch_reg_loss: 0.1665, reg_loss: 0.1661 ||:  47%|####6     | 52/111 [00:34<00:40,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9302, LAS: 0.8753, UEM: 0.4943, LEM: 0.2582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5434, partial_loss/deprel_loss: 0.5759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7360, loss: 0.8802, batch_reg_loss: 0.1666, reg_loss: 0.1662 ||:  50%|####9     | 55/111 [00:36<00:38,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9292, LAS: 0.8742, UEM: 0.4979, LEM: 0.2597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3299, partial_loss/deprel_loss: 0.5148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6445, loss: 0.8854, batch_reg_loss: 0.1666, reg_loss: 0.1662 ||:  52%|#####2    | 58/111 [00:38<00:37,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8848, UAS: 0.9300, LAS: 0.8748, UEM: 0.4960, LEM: 0.2542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5726, partial_loss/deprel_loss: 0.6414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7943, loss: 0.8809, batch_reg_loss: 0.1667, reg_loss: 0.1662 ||:  56%|#####5    | 62/111 [00:41<00:33,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8270, UAS: 0.9287, LAS: 0.8734, UEM: 0.4838, LEM: 0.2459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3249, partial_loss/deprel_loss: 0.9868, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2212, loss: 0.8900, batch_reg_loss: 0.1668, reg_loss: 0.1662 ||:  59%|#####9    | 66/111 [00:44<00:30,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9292, LAS: 0.8740, UEM: 0.4893, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2609, partial_loss/deprel_loss: 0.4625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5890, loss: 0.8867, batch_reg_loss: 0.1668, reg_loss: 0.1663 ||:  62%|######2   | 69/111 [00:46<00:29,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9279, LAS: 0.8726, UEM: 0.4918, LEM: 0.2529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2447, partial_loss/deprel_loss: 0.3762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5167, loss: 0.8979, batch_reg_loss: 0.1669, reg_loss: 0.1663 ||:  66%|######5   | 73/111 [00:49<00:26,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9283, LAS: 0.8730, UEM: 0.4954, LEM: 0.2557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4216, partial_loss/deprel_loss: 0.5738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7102, loss: 0.8955, batch_reg_loss: 0.1669, reg_loss: 0.1663 ||:  68%|######8   | 76/111 [00:51<00:24,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9292, LAS: 0.8739, UEM: 0.5096, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1119, partial_loss/deprel_loss: 0.2691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4047, loss: 0.8890, batch_reg_loss: 0.1670, reg_loss: 0.1663 ||:  71%|#######1  | 79/111 [00:53<00:22,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9568, UAS: 0.9288, LAS: 0.8736, UEM: 0.5289, LEM: 0.3012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0828, partial_loss/deprel_loss: 0.1641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3149, loss: 0.8923, batch_reg_loss: 0.1670, reg_loss: 0.1664 ||:  74%|#######3  | 82/111 [00:55<00:21,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8655, UAS: 0.9287, LAS: 0.8735, UEM: 0.5236, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8288, partial_loss/deprel_loss: 0.7915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9661, loss: 0.8928, batch_reg_loss: 0.1671, reg_loss: 0.1664 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9293, LAS: 0.8741, UEM: 0.5222, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2973, partial_loss/deprel_loss: 0.4618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5960, loss: 0.8897, batch_reg_loss: 0.1671, reg_loss: 0.1664 ||:  81%|########1 | 90/111 [01:00<00:14,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9300, LAS: 0.8750, UEM: 0.5309, LEM: 0.3014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3646, partial_loss/deprel_loss: 0.4656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6126, loss: 0.8813, batch_reg_loss: 0.1672, reg_loss: 0.1665 ||:  84%|########3 | 93/111 [01:02<00:12,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9304, LAS: 0.8754, UEM: 0.5302, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5344, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7641, loss: 0.8764, batch_reg_loss: 0.1672, reg_loss: 0.1665 ||:  86%|########6 | 96/111 [01:05<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9304, LAS: 0.8755, UEM: 0.5246, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9842, partial_loss/deprel_loss: 0.9223, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1020, loss: 0.8779, batch_reg_loss: 0.1673, reg_loss: 0.1665 ||:  90%|######### | 100/111 [01:07<00:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9302, LAS: 0.8752, UEM: 0.5250, LEM: 0.2941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3074, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5382, loss: 0.8795, batch_reg_loss: 0.1673, reg_loss: 0.1665 ||:  93%|#########2| 103/111 [01:09<00:05,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9305, LAS: 0.8756, UEM: 0.5243, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3452, partial_loss/deprel_loss: 0.4917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6297, loss: 0.8772, batch_reg_loss: 0.1673, reg_loss: 0.1666 ||:  96%|#########6| 107/111 [01:12<00:02,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.9307, LAS: 0.8759, UEM: 0.5311, LEM: 0.2999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0582, partial_loss/deprel_loss: 0.8997, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0988, loss: 0.8732, batch_reg_loss: 0.1674, reg_loss: 0.1666 ||:  99%|#########9| 110/111 [01:14<00:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9310, LAS: 0.8761, UEM: 0.5327, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3381, partial_loss/deprel_loss: 0.5684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6897, loss: 0.8716, batch_reg_loss: 0.1674, reg_loss: 0.1666 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-07 00:03:00,154 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9457, LAS: 0.8973, UEM: 0.7127, LEM: 0.5238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2112, partial_loss/deprel_loss: 20.6524, partial_loss/cycle_loss: 0.0000, batch_loss: 16.5642, loss: 23.9662, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8186, UAS: 0.9355, LAS: 0.8835, UEM: 0.6797, LEM: 0.4542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6319, partial_loss/deprel_loss: 58.9152, partial_loss/cycle_loss: 0.0000, batch_loss: 47.4585, loss: 28.1342, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:05<00:08,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9338, LAS: 0.8808, UEM: 0.6146, LEM: 0.3880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7457, partial_loss/deprel_loss: 30.3347, partial_loss/cycle_loss: 0.0000, batch_loss: 24.4169, loss: 29.2772, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:07<00:06,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9387, LAS: 0.8860, UEM: 0.6328, LEM: 0.3817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5421, partial_loss/deprel_loss: 24.5162, partial_loss/cycle_loss: 0.0000, batch_loss: 19.7214, loss: 27.9239, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:09<00:02,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9427, LAS: 0.8904, UEM: 0.6369, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7084, partial_loss/deprel_loss: 34.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 28.0063, loss: 26.2605, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9427, LAS: 0.8904, UEM: 0.6369, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7084, partial_loss/deprel_loss: 34.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 28.0063, loss: 26.2605, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.05it/s]\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.568  |    34.831\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.338  |     0.708\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.167  |     0.000\n",
+      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - UEM                      |     0.533  |     0.637\n",
+      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - LAS                      |     0.876  |     0.890\n",
+      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - loss                     |     0.872  |    26.260\n",
+      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - LEM                      |     0.300  |     0.368\n",
+      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - UAS                      |     0.931  |     0.943\n",
+      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - EM                       |     0.901  |     0.886\n",
+      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:03:12,595 - INFO - combo.training.trainer - Epoch duration: 0:01:28.088627\n",
+      "2023-04-07 00:03:12,595 - INFO - combo.training.trainer - Estimated training time remaining: 7:31:01\n",
+      "2023-04-07 00:03:12,595 - INFO - allennlp.training.trainer - Epoch 56/399\n",
+      "2023-04-07 00:03:12,595 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:03:12,595 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:03:12,602 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9052, LAS: 0.8484, UEM: 0.3495, LEM: 0.1702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4177, partial_loss/deprel_loss: 0.5719, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7085, loss: 1.0817, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:   3%|2         | 3/111 [00:02<01:19,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9245, LAS: 0.8711, UEM: 0.3775, LEM: 0.1822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7256, partial_loss/deprel_loss: 0.7942, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9480, loss: 0.9261, batch_reg_loss: 0.1675, reg_loss: 0.1675 ||:   6%|6         | 7/111 [00:04<01:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8121, UAS: 0.9251, LAS: 0.8701, UEM: 0.4158, LEM: 0.1978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5426, partial_loss/deprel_loss: 1.1777, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4182, loss: 0.9325, batch_reg_loss: 0.1675, reg_loss: 0.1675 ||:  10%|9         | 11/111 [00:06<01:06,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9213, LAS: 0.8668, UEM: 0.4016, LEM: 0.1869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5635, partial_loss/deprel_loss: 0.6340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7875, loss: 0.9613, batch_reg_loss: 0.1676, reg_loss: 0.1675 ||:  14%|#3        | 15/111 [00:09<01:02,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9253, LAS: 0.8701, UEM: 0.4440, LEM: 0.2079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4793, partial_loss/deprel_loss: 0.6229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7618, loss: 0.9270, batch_reg_loss: 0.1676, reg_loss: 0.1675 ||:  16%|#6        | 18/111 [00:11<01:02,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9262, LAS: 0.8708, UEM: 0.4256, LEM: 0.1955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7134, partial_loss/deprel_loss: 0.7947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9461, loss: 0.9189, batch_reg_loss: 0.1677, reg_loss: 0.1675 ||:  19%|#8        | 21/111 [00:13<01:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9281, LAS: 0.8735, UEM: 0.4891, LEM: 0.2687, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2322, partial_loss/deprel_loss: 0.9139, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1453, loss: 0.8989, batch_reg_loss: 0.1678, reg_loss: 0.1676 ||:  22%|##1       | 24/111 [00:15<00:59,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9323, LAS: 0.8779, UEM: 0.5258, LEM: 0.2887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6955, partial_loss/deprel_loss: 0.6607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8355, loss: 0.8635, batch_reg_loss: 0.1678, reg_loss: 0.1676 ||:  25%|##5       | 28/111 [00:18<00:55,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9335, LAS: 0.8788, UEM: 0.5304, LEM: 0.2891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6671, partial_loss/deprel_loss: 0.6794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8448, loss: 0.8535, batch_reg_loss: 0.1679, reg_loss: 0.1676 ||:  29%|##8       | 32/111 [00:20<00:51,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8620, UAS: 0.9307, LAS: 0.8755, UEM: 0.5065, LEM: 0.2739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8566, partial_loss/deprel_loss: 0.7906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9718, loss: 0.8817, batch_reg_loss: 0.1679, reg_loss: 0.1677 ||:  32%|###2      | 36/111 [00:23<00:47,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8542, UAS: 0.9307, LAS: 0.8759, UEM: 0.5141, LEM: 0.2816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8571, partial_loss/deprel_loss: 0.7935, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9742, loss: 0.8756, batch_reg_loss: 0.1680, reg_loss: 0.1677 ||:  36%|###6      | 40/111 [00:26<00:47,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9301, LAS: 0.8756, UEM: 0.5189, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9675, partial_loss/deprel_loss: 0.9376, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1116, loss: 0.8777, batch_reg_loss: 0.1681, reg_loss: 0.1677 ||:  40%|###9      | 44/111 [00:28<00:43,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9300, LAS: 0.8757, UEM: 0.5087, LEM: 0.2809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5739, partial_loss/deprel_loss: 0.5392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7143, loss: 0.8775, batch_reg_loss: 0.1681, reg_loss: 0.1678 ||:  43%|####3     | 48/111 [00:31<00:40,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9298, LAS: 0.8754, UEM: 0.5231, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3955, partial_loss/deprel_loss: 0.6056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7318, loss: 0.8786, batch_reg_loss: 0.1682, reg_loss: 0.1678 ||:  47%|####6     | 52/111 [00:33<00:38,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9317, LAS: 0.8777, UEM: 0.5608, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3015, partial_loss/deprel_loss: 0.4829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6149, loss: 0.8624, batch_reg_loss: 0.1683, reg_loss: 0.1678 ||:  50%|#####     | 56/111 [00:36<00:35,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8687, UAS: 0.9320, LAS: 0.8779, UEM: 0.5538, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7732, partial_loss/deprel_loss: 0.8248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9828, loss: 0.8628, batch_reg_loss: 0.1683, reg_loss: 0.1679 ||:  54%|#####4    | 60/111 [00:38<00:32,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9315, LAS: 0.8774, UEM: 0.5514, LEM: 0.3265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2844, partial_loss/deprel_loss: 0.4435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5800, loss: 0.8651, batch_reg_loss: 0.1684, reg_loss: 0.1679 ||:  58%|#####7    | 64/111 [00:41<00:31,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 0.9296, LAS: 0.8752, UEM: 0.5375, LEM: 0.3173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8510, partial_loss/deprel_loss: 0.7962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9756, loss: 0.8823, batch_reg_loss: 0.1684, reg_loss: 0.1679 ||:  61%|######1   | 68/111 [00:44<00:28,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9303, LAS: 0.8758, UEM: 0.5345, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6570, partial_loss/deprel_loss: 0.7377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8901, loss: 0.8786, batch_reg_loss: 0.1685, reg_loss: 0.1679 ||:  65%|######4   | 72/111 [00:46<00:25,  1.53it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9287, LAS: 0.8742, UEM: 0.5252, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5470, partial_loss/deprel_loss: 0.9589, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2450, loss: 0.8900, batch_reg_loss: 0.1686, reg_loss: 0.1680 ||:  68%|######8   | 76/111 [00:49<00:22,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9281, LAS: 0.8733, UEM: 0.5200, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0865, partial_loss/deprel_loss: 0.9616, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1552, loss: 0.8975, batch_reg_loss: 0.1686, reg_loss: 0.1680 ||:  72%|#######2  | 80/111 [00:51<00:19,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9276, LAS: 0.8728, UEM: 0.5178, LEM: 0.3011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2355, partial_loss/deprel_loss: 0.3739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5149, loss: 0.9017, batch_reg_loss: 0.1687, reg_loss: 0.1680 ||:  76%|#######5  | 84/111 [00:54<00:17,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9287, LAS: 0.8741, UEM: 0.5313, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9235, partial_loss/deprel_loss: 0.8001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9935, loss: 0.8910, batch_reg_loss: 0.1688, reg_loss: 0.1681 ||:  79%|#######9  | 88/111 [00:57<00:15,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9295, LAS: 0.8749, UEM: 0.5379, LEM: 0.3145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2532, partial_loss/deprel_loss: 0.3850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5275, loss: 0.8835, batch_reg_loss: 0.1688, reg_loss: 0.1681 ||:  82%|########1 | 91/111 [00:59<00:13,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8366, UAS: 0.9292, LAS: 0.8745, UEM: 0.5322, LEM: 0.3098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2230, partial_loss/deprel_loss: 1.0392, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2448, loss: 0.8888, batch_reg_loss: 0.1689, reg_loss: 0.1681 ||:  85%|########4 | 94/111 [01:01<00:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8414, UAS: 0.9293, LAS: 0.8746, UEM: 0.5293, LEM: 0.3064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1261, partial_loss/deprel_loss: 0.9523, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1560, loss: 0.8880, batch_reg_loss: 0.1689, reg_loss: 0.1681 ||:  87%|########7 | 97/111 [01:04<00:10,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9299, LAS: 0.8754, UEM: 0.5300, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3975, partial_loss/deprel_loss: 0.5280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6709, loss: 0.8825, batch_reg_loss: 0.1690, reg_loss: 0.1682 ||:  91%|######### | 101/111 [01:06<00:06,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9300, LAS: 0.8756, UEM: 0.5286, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4520, partial_loss/deprel_loss: 0.5662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7124, loss: 0.8817, batch_reg_loss: 0.1690, reg_loss: 0.1682 ||:  94%|#########3| 104/111 [01:08<00:04,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9309, LAS: 0.8767, UEM: 0.5328, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3614, partial_loss/deprel_loss: 0.5570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6869, loss: 0.8740, batch_reg_loss: 0.1691, reg_loss: 0.1682 ||:  97%|#########7| 108/111 [01:11<00:02,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9313, LAS: 0.8771, UEM: 0.5337, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3501, partial_loss/deprel_loss: 0.5126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6492, loss: 0.8706, batch_reg_loss: 0.1691, reg_loss: 0.1683 ||: 100%|##########| 111/111 [01:14<00:00,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9313, LAS: 0.8771, UEM: 0.5337, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3501, partial_loss/deprel_loss: 0.5126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6492, loss: 0.8706, batch_reg_loss: 0.1691, reg_loss: 0.1683 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.513  |       N/A\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.350  |       N/A\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.168  |       N/A\n",
+      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - UEM                      |     0.534  |       N/A\n",
+      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - LAS                      |     0.877  |       N/A\n",
+      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - loss                     |     0.871  |       N/A\n",
+      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - LEM                      |     0.305  |       N/A\n",
+      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - UAS                      |     0.931  |       N/A\n",
+      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - EM                       |     0.904  |       N/A\n",
+      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:04:26,675 - INFO - combo.training.trainer - Epoch duration: 0:01:14.079801\n",
+      "2023-04-07 00:04:26,675 - INFO - combo.training.trainer - Estimated training time remaining: 7:29:14\n",
+      "2023-04-07 00:04:26,675 - INFO - allennlp.training.trainer - Epoch 57/399\n",
+      "2023-04-07 00:04:26,675 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:04:26,675 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:04:26,683 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9574, LAS: 0.9082, UEM: 0.6799, LEM: 0.3935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2009, partial_loss/deprel_loss: 0.3836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5162, loss: 0.6548, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:   3%|2         | 3/111 [00:02<01:22,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9448, LAS: 0.8923, UEM: 0.5579, LEM: 0.2907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8817, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9765, loss: 0.7685, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||:   5%|5         | 6/111 [00:04<01:21,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9418, LAS: 0.8873, UEM: 0.5336, LEM: 0.2565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4015, partial_loss/deprel_loss: 0.5489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6886, loss: 0.8019, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||:   8%|8         | 9/111 [00:06<01:15,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9361, LAS: 0.8815, UEM: 0.5493, LEM: 0.2631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2932, partial_loss/deprel_loss: 0.4796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6116, loss: 0.8263, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||:  11%|#         | 12/111 [00:08<01:13,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9336, LAS: 0.8793, UEM: 0.5382, LEM: 0.2618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5175, partial_loss/deprel_loss: 0.6198, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7686, loss: 0.8427, batch_reg_loss: 0.1693, reg_loss: 0.1692 ||:  14%|#3        | 15/111 [00:10<01:09,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9344, LAS: 0.8807, UEM: 0.5316, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3015, partial_loss/deprel_loss: 0.4974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6276, loss: 0.8396, batch_reg_loss: 0.1693, reg_loss: 0.1692 ||:  16%|#6        | 18/111 [00:13<01:06,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9383, LAS: 0.8858, UEM: 0.5676, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2669, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.8026, batch_reg_loss: 0.1694, reg_loss: 0.1692 ||:  20%|#9        | 22/111 [00:15<01:03,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9375, LAS: 0.8848, UEM: 0.5659, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4388, partial_loss/deprel_loss: 0.5643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7086, loss: 0.8037, batch_reg_loss: 0.1694, reg_loss: 0.1693 ||:  23%|##2       | 25/111 [00:17<01:01,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9375, LAS: 0.8849, UEM: 0.5632, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9904, partial_loss/deprel_loss: 0.8711, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0644, loss: 0.8074, batch_reg_loss: 0.1695, reg_loss: 0.1693 ||:  25%|##5       | 28/111 [00:20<01:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9383, LAS: 0.8857, UEM: 0.5685, LEM: 0.2989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2511, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5460, loss: 0.7991, batch_reg_loss: 0.1695, reg_loss: 0.1693 ||:  28%|##7       | 31/111 [00:22<00:59,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9386, LAS: 0.8856, UEM: 0.5538, LEM: 0.2834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6780, partial_loss/deprel_loss: 0.7338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8922, loss: 0.8009, batch_reg_loss: 0.1695, reg_loss: 0.1693 ||:  32%|###1      | 35/111 [00:24<00:53,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9393, LAS: 0.8863, UEM: 0.5712, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1683, partial_loss/deprel_loss: 0.3453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4795, loss: 0.7953, batch_reg_loss: 0.1696, reg_loss: 0.1693 ||:  34%|###4      | 38/111 [00:27<00:50,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9381, LAS: 0.8853, UEM: 0.5535, LEM: 0.2932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8753, partial_loss/deprel_loss: 0.8562, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0296, loss: 0.8056, batch_reg_loss: 0.1696, reg_loss: 0.1694 ||:  38%|###7      | 42/111 [00:29<00:45,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9391, LAS: 0.8863, UEM: 0.5589, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2931, partial_loss/deprel_loss: 0.4550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5923, loss: 0.7981, batch_reg_loss: 0.1697, reg_loss: 0.1694 ||:  41%|####1     | 46/111 [00:32<00:45,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9383, LAS: 0.8852, UEM: 0.5596, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2342, partial_loss/deprel_loss: 0.9472, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1743, loss: 0.8052, batch_reg_loss: 0.1697, reg_loss: 0.1694 ||:  44%|####4     | 49/111 [00:34<00:43,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9382, LAS: 0.8851, UEM: 0.5530, LEM: 0.2922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4239, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6501, loss: 0.8059, batch_reg_loss: 0.1698, reg_loss: 0.1694 ||:  47%|####6     | 52/111 [00:36<00:41,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9379, LAS: 0.8845, UEM: 0.5488, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3379, partial_loss/deprel_loss: 0.5204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6537, loss: 0.8090, batch_reg_loss: 0.1698, reg_loss: 0.1695 ||:  50%|#####     | 56/111 [00:39<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9379, LAS: 0.8848, UEM: 0.5595, LEM: 0.3004, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2587, partial_loss/deprel_loss: 0.9625, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1916, loss: 0.8063, batch_reg_loss: 0.1699, reg_loss: 0.1695 ||:  53%|#####3    | 59/111 [00:41<00:35,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9372, LAS: 0.8841, UEM: 0.5497, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8368, partial_loss/deprel_loss: 0.7492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9366, loss: 0.8141, batch_reg_loss: 0.1699, reg_loss: 0.1695 ||:  56%|#####5    | 62/111 [00:43<00:35,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9372, LAS: 0.8840, UEM: 0.5502, LEM: 0.2970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2499, partial_loss/deprel_loss: 0.3824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5258, loss: 0.8138, batch_reg_loss: 0.1699, reg_loss: 0.1695 ||:  59%|#####8    | 65/111 [00:46<00:33,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9362, LAS: 0.8828, UEM: 0.5413, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8034, partial_loss/deprel_loss: 0.7748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9505, loss: 0.8236, batch_reg_loss: 0.1700, reg_loss: 0.1695 ||:  61%|######1   | 68/111 [00:48<00:30,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9372, LAS: 0.8837, UEM: 0.5485, LEM: 0.2933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2735, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5999, loss: 0.8154, batch_reg_loss: 0.1700, reg_loss: 0.1696 ||:  65%|######4   | 72/111 [00:50<00:27,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8537, UAS: 0.9369, LAS: 0.8832, UEM: 0.5447, LEM: 0.2896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8168, partial_loss/deprel_loss: 0.7835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9603, loss: 0.8159, batch_reg_loss: 0.1701, reg_loss: 0.1696 ||:  68%|######8   | 76/111 [00:53<00:23,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9351, LAS: 0.8814, UEM: 0.5352, LEM: 0.2840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8657, partial_loss/deprel_loss: 0.9087, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0703, loss: 0.8321, batch_reg_loss: 0.1702, reg_loss: 0.1696 ||:  72%|#######2  | 80/111 [00:55<00:20,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8396, UAS: 0.9344, LAS: 0.8804, UEM: 0.5286, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3138, partial_loss/deprel_loss: 0.9856, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2214, loss: 0.8418, batch_reg_loss: 0.1702, reg_loss: 0.1696 ||:  76%|#######5  | 84/111 [00:58<00:17,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7678, UAS: 0.9332, LAS: 0.8793, UEM: 0.5226, LEM: 0.2739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4154, partial_loss/deprel_loss: 1.4659, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8261, loss: 0.8530, batch_reg_loss: 0.1703, reg_loss: 0.1697 ||:  79%|#######9  | 88/111 [01:00<00:15,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8031, UAS: 0.9315, LAS: 0.8773, UEM: 0.5138, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6813, partial_loss/deprel_loss: 1.2116, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4759, loss: 0.8697, batch_reg_loss: 0.1704, reg_loss: 0.1697 ||:  83%|########2 | 92/111 [01:03<00:12,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8146, UAS: 0.9307, LAS: 0.8762, UEM: 0.5060, LEM: 0.2642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5085, partial_loss/deprel_loss: 1.0874, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3421, loss: 0.8791, batch_reg_loss: 0.1704, reg_loss: 0.1697 ||:  86%|########6 | 96/111 [01:06<00:10,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9313, LAS: 0.8770, UEM: 0.5214, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8799, partial_loss/deprel_loss: 0.7930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9809, loss: 0.8718, batch_reg_loss: 0.1705, reg_loss: 0.1698 ||:  89%|########9 | 99/111 [01:08<00:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8170, UAS: 0.9314, LAS: 0.8773, UEM: 0.5363, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5947, partial_loss/deprel_loss: 1.1252, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3897, loss: 0.8706, batch_reg_loss: 0.1705, reg_loss: 0.1698 ||:  92%|#########1| 102/111 [01:10<00:06,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9312, LAS: 0.8771, UEM: 0.5340, LEM: 0.3009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3184, partial_loss/deprel_loss: 0.5107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6428, loss: 0.8734, batch_reg_loss: 0.1706, reg_loss: 0.1698 ||:  95%|#########4| 105/111 [01:12<00:04,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9314, LAS: 0.8773, UEM: 0.5357, LEM: 0.3026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1379, partial_loss/deprel_loss: 0.4026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.8727, batch_reg_loss: 0.1707, reg_loss: 0.1698 ||:  98%|#########8| 109/111 [01:15<00:01,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9312, LAS: 0.8771, UEM: 0.5351, LEM: 0.3020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3903, partial_loss/deprel_loss: 1.0609, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2975, loss: 0.8749, batch_reg_loss: 0.1707, reg_loss: 0.1698 ||: 100%|##########| 111/111 [01:16<00:00,  1.44it/s]\n",
+      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.061  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.390  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.170  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - UEM                      |     0.535  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - LAS                      |     0.877  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - loss                     |     0.875  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - LEM                      |     0.302  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - UAS                      |     0.931  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - EM                       |     0.832  |       N/A\n",
+      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:05:43,648 - INFO - combo.training.trainer - Epoch duration: 0:01:16.973170\n",
+      "2023-04-07 00:05:43,648 - INFO - combo.training.trainer - Estimated training time remaining: 7:27:46\n",
+      "2023-04-07 00:05:43,648 - INFO - allennlp.training.trainer - Epoch 58/399\n",
+      "2023-04-07 00:05:43,649 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:05:43,649 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:05:43,656 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9596, UAS: 0.9595, LAS: 0.9153, UEM: 0.8286, LEM: 0.6638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0595, partial_loss/deprel_loss: 0.1632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3132, loss: 0.6007, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:   3%|2         | 3/111 [00:02<01:31,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9561, LAS: 0.9084, UEM: 0.7561, LEM: 0.5438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3785, partial_loss/deprel_loss: 0.5578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.6717, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:   5%|5         | 6/111 [00:04<01:24,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9398, LAS: 0.8906, UEM: 0.6781, LEM: 0.4762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4555, partial_loss/deprel_loss: 0.6072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7477, loss: 0.8015, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:   8%|8         | 9/111 [00:06<01:19,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9390, LAS: 0.8898, UEM: 0.6879, LEM: 0.4847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1247, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4267, loss: 0.7959, batch_reg_loss: 0.1709, reg_loss: 0.1708 ||:  11%|#         | 12/111 [00:09<01:16,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9394, LAS: 0.8893, UEM: 0.6638, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4382, partial_loss/deprel_loss: 0.5194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6741, loss: 0.7959, batch_reg_loss: 0.1709, reg_loss: 0.1708 ||:  14%|#3        | 15/111 [00:11<01:13,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9375, LAS: 0.8866, UEM: 0.6227, LEM: 0.4106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4958, partial_loss/deprel_loss: 0.5977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7483, loss: 0.8116, batch_reg_loss: 0.1710, reg_loss: 0.1708 ||:  16%|#6        | 18/111 [00:13<01:09,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9390, LAS: 0.8878, UEM: 0.6204, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3002, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6721, loss: 0.7963, batch_reg_loss: 0.1710, reg_loss: 0.1709 ||:  19%|#8        | 21/111 [00:15<01:06,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9392, LAS: 0.8883, UEM: 0.6134, LEM: 0.3908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7934, partial_loss/deprel_loss: 0.7961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9666, loss: 0.7907, batch_reg_loss: 0.1711, reg_loss: 0.1709 ||:  22%|##1       | 24/111 [00:17<01:03,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9363, LAS: 0.8847, UEM: 0.5900, LEM: 0.3708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5115, partial_loss/deprel_loss: 0.6097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7612, loss: 0.8143, batch_reg_loss: 0.1711, reg_loss: 0.1709 ||:  24%|##4       | 27/111 [00:19<01:01,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8642, UAS: 0.9362, LAS: 0.8844, UEM: 0.5729, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9451, partial_loss/deprel_loss: 0.7701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9762, loss: 0.8149, batch_reg_loss: 0.1712, reg_loss: 0.1709 ||:  28%|##7       | 31/111 [00:22<00:55,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9355, LAS: 0.8831, UEM: 0.5606, LEM: 0.3357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8069, partial_loss/deprel_loss: 0.7371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9223, loss: 0.8263, batch_reg_loss: 0.1712, reg_loss: 0.1710 ||:  31%|###       | 34/111 [00:24<00:52,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8912, UAS: 0.9365, LAS: 0.8844, UEM: 0.5572, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.6048, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7657, loss: 0.8172, batch_reg_loss: 0.1712, reg_loss: 0.1710 ||:  33%|###3      | 37/111 [00:26<00:50,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8538, UAS: 0.9357, LAS: 0.8834, UEM: 0.5464, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0253, partial_loss/deprel_loss: 0.8089, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0234, loss: 0.8234, batch_reg_loss: 0.1713, reg_loss: 0.1710 ||:  37%|###6      | 41/111 [00:29<00:47,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9355, LAS: 0.8831, UEM: 0.5659, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2456, partial_loss/deprel_loss: 0.4127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5506, loss: 0.8257, batch_reg_loss: 0.1713, reg_loss: 0.1710 ||:  40%|###9      | 44/111 [00:31<00:46,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8660, UAS: 0.9308, LAS: 0.8782, UEM: 0.5494, LEM: 0.3243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9662, partial_loss/deprel_loss: 0.8248, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0244, loss: 0.8680, batch_reg_loss: 0.1714, reg_loss: 0.1711 ||:  43%|####3     | 48/111 [00:33<00:42,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9301, LAS: 0.8776, UEM: 0.5468, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3291, partial_loss/deprel_loss: 0.4619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6068, loss: 0.8733, batch_reg_loss: 0.1714, reg_loss: 0.1711 ||:  46%|####5     | 51/111 [00:36<00:42,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9301, LAS: 0.8774, UEM: 0.5459, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2580, partial_loss/deprel_loss: 0.4262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5641, loss: 0.8732, batch_reg_loss: 0.1715, reg_loss: 0.1711 ||:  49%|####8     | 54/111 [00:38<00:39,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.9303, LAS: 0.8775, UEM: 0.5463, LEM: 0.3237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9609, partial_loss/deprel_loss: 0.8621, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0534, loss: 0.8687, batch_reg_loss: 0.1716, reg_loss: 0.1711 ||:  51%|#####1    | 57/111 [00:40<00:38,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8988, UAS: 0.9323, LAS: 0.8796, UEM: 0.5627, LEM: 0.3346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4283, partial_loss/deprel_loss: 0.5501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6973, loss: 0.8529, batch_reg_loss: 0.1716, reg_loss: 0.1712 ||:  55%|#####4    | 61/111 [00:42<00:34,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8381, UAS: 0.9310, LAS: 0.8782, UEM: 0.5520, LEM: 0.3267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1179, partial_loss/deprel_loss: 0.8586, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0821, loss: 0.8627, batch_reg_loss: 0.1717, reg_loss: 0.1712 ||:  59%|#####8    | 65/111 [00:45<00:31,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9320, LAS: 0.8792, UEM: 0.5555, LEM: 0.3268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5933, partial_loss/deprel_loss: 0.6654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8227, loss: 0.8550, batch_reg_loss: 0.1717, reg_loss: 0.1712 ||:  61%|######1   | 68/111 [00:47<00:29,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9326, LAS: 0.8796, UEM: 0.5645, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1658, partial_loss/deprel_loss: 0.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5465, loss: 0.8516, batch_reg_loss: 0.1718, reg_loss: 0.1712 ||:  64%|######3   | 71/111 [00:49<00:28,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9329, LAS: 0.8797, UEM: 0.5560, LEM: 0.3247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6251, partial_loss/deprel_loss: 0.7558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9015, loss: 0.8517, batch_reg_loss: 0.1718, reg_loss: 0.1713 ||:  68%|######7   | 75/111 [00:52<00:23,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9324, LAS: 0.8787, UEM: 0.5451, LEM: 0.3162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0988, partial_loss/deprel_loss: 0.9087, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1186, loss: 0.8610, batch_reg_loss: 0.1719, reg_loss: 0.1713 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9328, LAS: 0.8791, UEM: 0.5434, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3353, partial_loss/deprel_loss: 0.5287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6619, loss: 0.8598, batch_reg_loss: 0.1719, reg_loss: 0.1713 ||:  74%|#######3  | 82/111 [00:57<00:19,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9323, LAS: 0.8787, UEM: 0.5416, LEM: 0.3104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7752, partial_loss/deprel_loss: 0.7615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9362, loss: 0.8612, batch_reg_loss: 0.1719, reg_loss: 0.1713 ||:  77%|#######6  | 85/111 [00:59<00:18,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9317, LAS: 0.8779, UEM: 0.5354, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5456, partial_loss/deprel_loss: 0.5851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7492, loss: 0.8666, batch_reg_loss: 0.1720, reg_loss: 0.1714 ||:  79%|#######9  | 88/111 [01:01<00:15,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9319, LAS: 0.8783, UEM: 0.5453, LEM: 0.3187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1393, partial_loss/deprel_loss: 0.2585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4067, loss: 0.8646, batch_reg_loss: 0.1720, reg_loss: 0.1714 ||:  83%|########2 | 92/111 [01:04<00:13,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8494, UAS: 0.9318, LAS: 0.8782, UEM: 0.5385, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9511, partial_loss/deprel_loss: 0.9121, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0920, loss: 0.8661, batch_reg_loss: 0.1721, reg_loss: 0.1714 ||:  86%|########6 | 96/111 [01:06<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8852, UAS: 0.9316, LAS: 0.8780, UEM: 0.5317, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6062, partial_loss/deprel_loss: 0.6751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8335, loss: 0.8693, batch_reg_loss: 0.1722, reg_loss: 0.1714 ||:  90%|######### | 100/111 [01:09<00:07,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9321, LAS: 0.8787, UEM: 0.5358, LEM: 0.3087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2498, partial_loss/deprel_loss: 0.3508, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5029, loss: 0.8622, batch_reg_loss: 0.1722, reg_loss: 0.1715 ||:  94%|#########3| 104/111 [01:11<00:04,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9325, LAS: 0.8791, UEM: 0.5368, LEM: 0.3090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6178, partial_loss/deprel_loss: 0.7346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8835, loss: 0.8581, batch_reg_loss: 0.1723, reg_loss: 0.1715 ||:  96%|#########6| 107/111 [01:13<00:02,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9318, LAS: 0.8783, UEM: 0.5331, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2776, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5764, loss: 0.8651, batch_reg_loss: 0.1723, reg_loss: 0.1715 ||: 100%|##########| 111/111 [01:16<00:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9318, LAS: 0.8783, UEM: 0.5331, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2776, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5764, loss: 0.8651, batch_reg_loss: 0.1723, reg_loss: 0.1715 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-07 00:07:00,259 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:07:00,259 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:07:00,259 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.436  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.278  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - UEM                      |     0.533  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - LAS                      |     0.878  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - loss                     |     0.865  |       N/A\n",
+      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - LEM                      |     0.307  |       N/A\n",
+      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - UAS                      |     0.932  |       N/A\n",
+      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - EM                       |     0.913  |       N/A\n",
+      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:07:00,262 - INFO - combo.training.trainer - Epoch duration: 0:01:16.613383\n",
+      "2023-04-07 00:07:00,262 - INFO - combo.training.trainer - Estimated training time remaining: 7:26:16\n",
+      "2023-04-07 00:07:00,262 - INFO - allennlp.training.trainer - Epoch 59/399\n",
+      "2023-04-07 00:07:00,262 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:07:00,263 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:07:00,270 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9336, LAS: 0.8775, UEM: 0.3808, LEM: 0.1360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7637, partial_loss/deprel_loss: 0.6570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8507, loss: 0.8668, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:   4%|3         | 4/111 [00:02<01:07,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9333, LAS: 0.8780, UEM: 0.5207, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2748, partial_loss/deprel_loss: 0.4359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5761, loss: 0.8606, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:   6%|6         | 7/111 [00:04<01:08,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8552, UAS: 0.9347, LAS: 0.8794, UEM: 0.4916, LEM: 0.2364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9107, partial_loss/deprel_loss: 0.8228, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0128, loss: 0.8498, batch_reg_loss: 0.1725, reg_loss: 0.1724 ||:   9%|9         | 10/111 [00:06<01:07,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9266, LAS: 0.8729, UEM: 0.4409, LEM: 0.2103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3004, partial_loss/deprel_loss: 0.9704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2089, loss: 0.8981, batch_reg_loss: 0.1725, reg_loss: 0.1724 ||:  12%|#1        | 13/111 [00:08<01:05,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9335, LAS: 0.8811, UEM: 0.5484, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1577, partial_loss/deprel_loss: 0.3573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4900, loss: 0.8355, batch_reg_loss: 0.1726, reg_loss: 0.1725 ||:  14%|#4        | 16/111 [00:11<01:06,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8034, UAS: 0.9277, LAS: 0.8738, UEM: 0.4982, LEM: 0.2656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9376, partial_loss/deprel_loss: 1.0868, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4295, loss: 0.8938, batch_reg_loss: 0.1726, reg_loss: 0.1725 ||:  18%|#8        | 20/111 [00:13<01:00,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9292, LAS: 0.8751, UEM: 0.5387, LEM: 0.3178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1075, partial_loss/deprel_loss: 0.2709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4109, loss: 0.8872, batch_reg_loss: 0.1727, reg_loss: 0.1725 ||:  21%|##        | 23/111 [00:15<00:59,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9307, LAS: 0.8770, UEM: 0.5338, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3092, partial_loss/deprel_loss: 0.4545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5981, loss: 0.8721, batch_reg_loss: 0.1727, reg_loss: 0.1725 ||:  23%|##3       | 26/111 [00:18<01:01,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9296, LAS: 0.8759, UEM: 0.5318, LEM: 0.3076, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5820, partial_loss/deprel_loss: 0.6105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7775, loss: 0.8817, batch_reg_loss: 0.1728, reg_loss: 0.1726 ||:  26%|##6       | 29/111 [00:20<00:58,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9292, LAS: 0.8753, UEM: 0.5118, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8447, partial_loss/deprel_loss: 0.8250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0018, loss: 0.8869, batch_reg_loss: 0.1728, reg_loss: 0.1726 ||:  29%|##8       | 32/111 [00:22<00:55,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9321, LAS: 0.8791, UEM: 0.5550, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2176, partial_loss/deprel_loss: 0.3670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5100, loss: 0.8576, batch_reg_loss: 0.1728, reg_loss: 0.1726 ||:  32%|###1      | 35/111 [00:24<00:54,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9342, LAS: 0.8816, UEM: 0.5933, LEM: 0.3763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0539, partial_loss/deprel_loss: 0.1786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3265, loss: 0.8401, batch_reg_loss: 0.1729, reg_loss: 0.1726 ||:  34%|###4      | 38/111 [00:27<00:56,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9332, LAS: 0.8807, UEM: 0.5845, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8210, partial_loss/deprel_loss: 0.7104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9054, loss: 0.8468, batch_reg_loss: 0.1729, reg_loss: 0.1726 ||:  37%|###6      | 41/111 [00:29<00:52,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9329, LAS: 0.8802, UEM: 0.5758, LEM: 0.3590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0728, partial_loss/deprel_loss: 0.9505, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1480, loss: 0.8477, batch_reg_loss: 0.1730, reg_loss: 0.1727 ||:  40%|###9      | 44/111 [00:31<00:49,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9333, LAS: 0.8805, UEM: 0.5705, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3542, partial_loss/deprel_loss: 0.4947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6395, loss: 0.8465, batch_reg_loss: 0.1730, reg_loss: 0.1727 ||:  42%|####2     | 47/111 [00:33<00:46,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9328, LAS: 0.8799, UEM: 0.5733, LEM: 0.3577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1635, partial_loss/deprel_loss: 0.3313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4708, loss: 0.8541, batch_reg_loss: 0.1730, reg_loss: 0.1727 ||:  46%|####5     | 51/111 [00:36<00:43,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9341, LAS: 0.8814, UEM: 0.5789, LEM: 0.3594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3308, partial_loss/deprel_loss: 0.5056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6438, loss: 0.8426, batch_reg_loss: 0.1731, reg_loss: 0.1727 ||:  49%|####8     | 54/111 [00:38<00:41,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9337, LAS: 0.8810, UEM: 0.5784, LEM: 0.3584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2728, partial_loss/deprel_loss: 0.4433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5823, loss: 0.8452, batch_reg_loss: 0.1731, reg_loss: 0.1727 ||:  51%|#####1    | 57/111 [00:40<00:39,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9347, LAS: 0.8819, UEM: 0.5824, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5877, partial_loss/deprel_loss: 0.6521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8124, loss: 0.8381, batch_reg_loss: 0.1732, reg_loss: 0.1728 ||:  54%|#####4    | 60/111 [00:43<00:38,  1.33it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8242, UAS: 0.9333, LAS: 0.8805, UEM: 0.5715, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4308, partial_loss/deprel_loss: 1.1157, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3520, loss: 0.8506, batch_reg_loss: 0.1732, reg_loss: 0.1728 ||:  57%|#####6    | 63/111 [00:45<00:35,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9334, LAS: 0.8804, UEM: 0.5614, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7164, partial_loss/deprel_loss: 0.7620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9261, loss: 0.8528, batch_reg_loss: 0.1733, reg_loss: 0.1728 ||:  60%|######    | 67/111 [00:47<00:29,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8562, UAS: 0.9334, LAS: 0.8803, UEM: 0.5556, LEM: 0.3320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9412, partial_loss/deprel_loss: 0.8262, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0225, loss: 0.8533, batch_reg_loss: 0.1733, reg_loss: 0.1728 ||:  64%|######3   | 71/111 [00:49<00:25,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9320, LAS: 0.8785, UEM: 0.5549, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1992, partial_loss/deprel_loss: 0.3865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5224, loss: 0.8659, batch_reg_loss: 0.1734, reg_loss: 0.1729 ||:  68%|######7   | 75/111 [00:52<00:23,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8442, UAS: 0.9316, LAS: 0.8779, UEM: 0.5463, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0091, partial_loss/deprel_loss: 0.9599, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1432, loss: 0.8711, batch_reg_loss: 0.1734, reg_loss: 0.1729 ||:  71%|#######1  | 79/111 [00:55<00:21,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9326, LAS: 0.8789, UEM: 0.5523, LEM: 0.3229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2824, partial_loss/deprel_loss: 0.4500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5900, loss: 0.8622, batch_reg_loss: 0.1735, reg_loss: 0.1729 ||:  75%|#######4  | 83/111 [00:58<00:19,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9327, LAS: 0.8790, UEM: 0.5486, LEM: 0.3190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2842, partial_loss/deprel_loss: 0.5412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6634, loss: 0.8606, batch_reg_loss: 0.1735, reg_loss: 0.1729 ||:  77%|#######7  | 86/111 [01:00<00:17,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9320, LAS: 0.8782, UEM: 0.5492, LEM: 0.3182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2800, partial_loss/deprel_loss: 0.4778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.8675, batch_reg_loss: 0.1736, reg_loss: 0.1730 ||:  80%|########  | 89/111 [01:02<00:15,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9325, LAS: 0.8787, UEM: 0.5477, LEM: 0.3148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6621, partial_loss/deprel_loss: 0.7544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9096, loss: 0.8624, batch_reg_loss: 0.1736, reg_loss: 0.1730 ||:  84%|########3 | 93/111 [01:04<00:12,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9321, LAS: 0.8784, UEM: 0.5426, LEM: 0.3108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9823, partial_loss/deprel_loss: 0.8097, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0179, loss: 0.8656, batch_reg_loss: 0.1737, reg_loss: 0.1730 ||:  86%|########6 | 96/111 [01:06<00:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9319, LAS: 0.8782, UEM: 0.5405, LEM: 0.3084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4858, partial_loss/deprel_loss: 0.6298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7747, loss: 0.8675, batch_reg_loss: 0.1737, reg_loss: 0.1730 ||:  90%|######### | 100/111 [01:09<00:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9323, LAS: 0.8785, UEM: 0.5404, LEM: 0.3064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5189, partial_loss/deprel_loss: 0.6216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7748, loss: 0.8655, batch_reg_loss: 0.1738, reg_loss: 0.1731 ||:  94%|#########3| 104/111 [01:12<00:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9324, LAS: 0.8785, UEM: 0.5361, LEM: 0.3023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4727, partial_loss/deprel_loss: 0.5968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7458, loss: 0.8654, batch_reg_loss: 0.1738, reg_loss: 0.1731 ||:  96%|#########6| 107/111 [01:14<00:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.9322, LAS: 0.8783, UEM: 0.5396, LEM: 0.3066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7106, partial_loss/deprel_loss: 0.7900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9480, loss: 0.8659, batch_reg_loss: 0.1739, reg_loss: 0.1731 ||:  99%|#########9| 110/111 [01:16<00:00,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8374, UAS: 0.9319, LAS: 0.8779, UEM: 0.5374, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1673, partial_loss/deprel_loss: 0.9337, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1543, loss: 0.8685, batch_reg_loss: 0.1739, reg_loss: 0.1731 ||: 100%|##########| 111/111 [01:17<00:00,  1.44it/s]\n",
+      "2023-04-07 00:08:17,587 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:08:17,587 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:08:17,587 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.934  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.167  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - UEM                      |     0.537  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - LAS                      |     0.878  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - loss                     |     0.869  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - LEM                      |     0.305  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - UAS                      |     0.932  |       N/A\n",
+      "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - EM                       |     0.837  |       N/A\n",
+      "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:08:17,589 - INFO - combo.training.trainer - Epoch duration: 0:01:17.327204\n",
+      "2023-04-07 00:08:17,589 - INFO - combo.training.trainer - Estimated training time remaining: 7:24:51\n",
+      "2023-04-07 00:08:17,590 - INFO - allennlp.training.trainer - Epoch 60/399\n",
+      "2023-04-07 00:08:17,590 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:08:17,590 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:08:17,598 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9362, LAS: 0.8814, UEM: 0.3503, LEM: 0.1203, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8053, partial_loss/deprel_loss: 0.7054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8993, loss: 0.8470, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:   3%|2         | 3/111 [00:02<01:20,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9321, LAS: 0.8779, UEM: 0.3913, LEM: 0.1676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2081, partial_loss/deprel_loss: 0.9663, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1886, loss: 0.8611, batch_reg_loss: 0.1740, reg_loss: 0.1739 ||:   6%|6         | 7/111 [00:04<01:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7929, UAS: 0.9231, LAS: 0.8686, UEM: 0.3932, LEM: 0.1813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0036, partial_loss/deprel_loss: 1.1850, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5227, loss: 0.9405, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:   9%|9         | 10/111 [00:07<01:13,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9264, LAS: 0.8725, UEM: 0.4786, LEM: 0.2742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1777, partial_loss/deprel_loss: 0.3238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.9067, batch_reg_loss: 0.1741, reg_loss: 0.1740 ||:  12%|#1        | 13/111 [00:09<01:14,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9316, LAS: 0.8780, UEM: 0.5387, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6095, partial_loss/deprel_loss: 0.6517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8174, loss: 0.8575, batch_reg_loss: 0.1741, reg_loss: 0.1740 ||:  14%|#4        | 16/111 [00:11<01:10,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9362, LAS: 0.8836, UEM: 0.6020, LEM: 0.3786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0994, partial_loss/deprel_loss: 0.2475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3920, loss: 0.8120, batch_reg_loss: 0.1742, reg_loss: 0.1740 ||:  18%|#8        | 20/111 [00:14<01:04,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9373, LAS: 0.8850, UEM: 0.5973, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5161, partial_loss/deprel_loss: 0.6815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8226, loss: 0.8053, batch_reg_loss: 0.1742, reg_loss: 0.1741 ||:  22%|##1       | 24/111 [00:16<00:59,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9403, LAS: 0.8883, UEM: 0.6151, LEM: 0.3769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4976, partial_loss/deprel_loss: 0.6561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7986, loss: 0.7819, batch_reg_loss: 0.1742, reg_loss: 0.1741 ||:  25%|##5       | 28/111 [00:19<00:54,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8948, UAS: 0.9413, LAS: 0.8891, UEM: 0.6076, LEM: 0.3650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4554, partial_loss/deprel_loss: 0.5114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6744, loss: 0.7749, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||:  28%|##7       | 31/111 [00:21<00:54,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9397, LAS: 0.8876, UEM: 0.6007, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2657, partial_loss/deprel_loss: 0.4361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5763, loss: 0.7878, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||:  31%|###       | 34/111 [00:23<00:53,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8368, UAS: 0.9376, LAS: 0.8857, UEM: 0.5841, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2452, partial_loss/deprel_loss: 0.9293, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1668, loss: 0.8026, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||:  33%|###3      | 37/111 [00:25<00:52,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9343, LAS: 0.8819, UEM: 0.5689, LEM: 0.3378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8595, partial_loss/deprel_loss: 0.8019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9878, loss: 0.8301, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||:  36%|###6      | 40/111 [00:27<00:50,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8483, UAS: 0.9321, LAS: 0.8796, UEM: 0.5564, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1939, partial_loss/deprel_loss: 0.9149, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1451, loss: 0.8517, batch_reg_loss: 0.1744, reg_loss: 0.1742 ||:  40%|###9      | 44/111 [00:30<00:47,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9335, LAS: 0.8809, UEM: 0.5663, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3052, partial_loss/deprel_loss: 0.4650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6075, loss: 0.8412, batch_reg_loss: 0.1744, reg_loss: 0.1742 ||:  42%|####2     | 47/111 [00:32<00:46,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9348, LAS: 0.8828, UEM: 0.5920, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6005, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7820, loss: 0.8263, batch_reg_loss: 0.1745, reg_loss: 0.1742 ||:  45%|####5     | 50/111 [00:35<00:47,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8130, UAS: 0.9329, LAS: 0.8806, UEM: 0.5860, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5709, partial_loss/deprel_loss: 1.0503, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3290, loss: 0.8424, batch_reg_loss: 0.1745, reg_loss: 0.1742 ||:  48%|####7     | 53/111 [00:38<00:45,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8496, UAS: 0.9336, LAS: 0.8812, UEM: 0.5811, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9414, partial_loss/deprel_loss: 0.9016, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0842, loss: 0.8390, batch_reg_loss: 0.1746, reg_loss: 0.1742 ||:  51%|#####1    | 57/111 [00:40<00:39,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8404, UAS: 0.9304, LAS: 0.8778, UEM: 0.5673, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2525, partial_loss/deprel_loss: 0.9174, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1591, loss: 0.8677, batch_reg_loss: 0.1746, reg_loss: 0.1743 ||:  55%|#####4    | 61/111 [00:43<00:35,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.9310, LAS: 0.8782, UEM: 0.5702, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9025, partial_loss/deprel_loss: 0.9015, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0764, loss: 0.8632, batch_reg_loss: 0.1747, reg_loss: 0.1743 ||:  58%|#####7    | 64/111 [00:45<00:33,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9320, LAS: 0.8794, UEM: 0.5685, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3395, partial_loss/deprel_loss: 0.4841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6300, loss: 0.8545, batch_reg_loss: 0.1748, reg_loss: 0.1743 ||:  61%|######1   | 68/111 [00:47<00:29,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9312, LAS: 0.8783, UEM: 0.5588, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7327, partial_loss/deprel_loss: 0.7282, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9039, loss: 0.8620, batch_reg_loss: 0.1748, reg_loss: 0.1743 ||:  64%|######3   | 71/111 [00:50<00:28,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9307, LAS: 0.8778, UEM: 0.5490, LEM: 0.3263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0077, partial_loss/deprel_loss: 0.8423, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0502, loss: 0.8669, batch_reg_loss: 0.1749, reg_loss: 0.1744 ||:  68%|######7   | 75/111 [00:52<00:24,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9306, LAS: 0.8776, UEM: 0.5447, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3445, partial_loss/deprel_loss: 0.5258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6645, loss: 0.8677, batch_reg_loss: 0.1749, reg_loss: 0.1744 ||:  70%|#######   | 78/111 [00:54<00:22,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9295, LAS: 0.8763, UEM: 0.5389, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3530, partial_loss/deprel_loss: 0.5616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6949, loss: 0.8791, batch_reg_loss: 0.1750, reg_loss: 0.1744 ||:  74%|#######3  | 82/111 [00:57<00:19,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9295, LAS: 0.8762, UEM: 0.5307, LEM: 0.3081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8574, partial_loss/deprel_loss: 0.7822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9723, loss: 0.8802, batch_reg_loss: 0.1750, reg_loss: 0.1744 ||:  77%|#######7  | 86/111 [00:59<00:16,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9299, LAS: 0.8766, UEM: 0.5393, LEM: 0.3177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1638, partial_loss/deprel_loss: 0.3223, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4657, loss: 0.8764, batch_reg_loss: 0.1751, reg_loss: 0.1745 ||:  81%|########1 | 90/111 [01:02<00:14,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9300, LAS: 0.8768, UEM: 0.5359, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4274, partial_loss/deprel_loss: 0.5398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6925, loss: 0.8751, batch_reg_loss: 0.1751, reg_loss: 0.1745 ||:  84%|########3 | 93/111 [01:05<00:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9306, LAS: 0.8774, UEM: 0.5408, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2533, partial_loss/deprel_loss: 0.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.8691, batch_reg_loss: 0.1752, reg_loss: 0.1745 ||:  87%|########7 | 97/111 [01:07<00:09,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9311, LAS: 0.8780, UEM: 0.5431, LEM: 0.3172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5743, partial_loss/deprel_loss: 0.6671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8238, loss: 0.8644, batch_reg_loss: 0.1752, reg_loss: 0.1745 ||:  90%|######### | 100/111 [01:10<00:08,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8498, UAS: 0.9306, LAS: 0.8773, UEM: 0.5365, LEM: 0.3118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0491, partial_loss/deprel_loss: 0.9409, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1378, loss: 0.8708, batch_reg_loss: 0.1753, reg_loss: 0.1746 ||:  94%|#########3| 104/111 [01:12<00:04,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9302, LAS: 0.8767, UEM: 0.5311, LEM: 0.3074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4103, partial_loss/deprel_loss: 0.5165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6706, loss: 0.8771, batch_reg_loss: 0.1753, reg_loss: 0.1746 ||:  97%|#########7| 108/111 [01:14<00:01,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8729, UAS: 0.9305, LAS: 0.8769, UEM: 0.5294, LEM: 0.3047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6519, partial_loss/deprel_loss: 0.7411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8986, loss: 0.8754, batch_reg_loss: 0.1754, reg_loss: 0.1746 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-07 00:09:34,322 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9379, LAS: 0.8794, UEM: 0.4599, LEM: 0.1283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5266, partial_loss/deprel_loss: 24.2651, partial_loss/cycle_loss: 0.0000, batch_loss: 19.5174, loss: 24.7563, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9527, LAS: 0.8970, UEM: 0.6623, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4145, partial_loss/deprel_loss: 26.3179, partial_loss/cycle_loss: 0.0000, batch_loss: 21.1372, loss: 22.3640, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.11it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9426, LAS: 0.8873, UEM: 0.6137, LEM: 0.2966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6098, partial_loss/deprel_loss: 34.3925, partial_loss/cycle_loss: 0.0000, batch_loss: 27.6359, loss: 26.0534, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8674, UAS: 0.9435, LAS: 0.8887, UEM: 0.5935, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0499, partial_loss/deprel_loss: 43.7402, partial_loss/cycle_loss: 0.0000, batch_loss: 35.2022, loss: 25.6088, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9441, LAS: 0.8910, UEM: 0.6411, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3157, partial_loss/deprel_loss: 48.7881, partial_loss/cycle_loss: 0.0000, batch_loss: 39.2936, loss: 25.9567, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9441, LAS: 0.8910, UEM: 0.6411, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3157, partial_loss/deprel_loss: 48.7881, partial_loss/cycle_loss: 0.0000, batch_loss: 39.2936, loss: 25.9567, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.04it/s]\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.741  |    48.788\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.652  |     1.316\n",
+      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.175  |     0.000\n",
+      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - UEM                      |     0.529  |     0.641\n",
+      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - LAS                      |     0.877  |     0.891\n",
+      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - loss                     |     0.875  |    25.957\n",
+      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - LEM                      |     0.305  |     0.372\n",
+      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |     0.944\n",
+      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - EM                       |     0.873  |     0.861\n",
+      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:09:49,183 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:09:50,393 - INFO - combo.training.trainer - Epoch duration: 0:01:32.803051\n",
+      "2023-04-07 00:09:50,393 - INFO - combo.training.trainer - Estimated training time remaining: 7:24:52\n",
+      "2023-04-07 00:09:50,393 - INFO - allennlp.training.trainer - Epoch 61/399\n",
+      "2023-04-07 00:09:50,393 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:09:50,393 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:09:50,399 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9301, LAS: 0.8725, UEM: 0.4525, LEM: 0.2185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7400, partial_loss/deprel_loss: 0.8407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9960, loss: 0.8934, batch_reg_loss: 0.1754, reg_loss: 0.1754 ||:   3%|2         | 3/111 [00:02<01:12,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9359, LAS: 0.8807, UEM: 0.5602, LEM: 0.3259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5457, partial_loss/deprel_loss: 0.6338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7916, loss: 0.8117, batch_reg_loss: 0.1755, reg_loss: 0.1754 ||:   5%|5         | 6/111 [00:04<01:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9390, LAS: 0.8858, UEM: 0.5364, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4178, partial_loss/deprel_loss: 0.5122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6688, loss: 0.7848, batch_reg_loss: 0.1755, reg_loss: 0.1754 ||:   8%|8         | 9/111 [00:06<01:10,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7975, UAS: 0.9267, LAS: 0.8726, UEM: 0.4816, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7705, partial_loss/deprel_loss: 1.2301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5137, loss: 0.9004, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  11%|#         | 12/111 [00:08<01:11,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9329, LAS: 0.8789, UEM: 0.5466, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4847, partial_loss/deprel_loss: 0.5487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7115, loss: 0.8472, batch_reg_loss: 0.1756, reg_loss: 0.1755 ||:  14%|#3        | 15/111 [00:10<01:07,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9263, LAS: 0.8721, UEM: 0.4951, LEM: 0.2746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4953, partial_loss/deprel_loss: 0.9569, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2402, loss: 0.9045, batch_reg_loss: 0.1757, reg_loss: 0.1755 ||:  17%|#7        | 19/111 [00:13<01:02,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9278, LAS: 0.8743, UEM: 0.5035, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2306, partial_loss/deprel_loss: 0.3509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5025, loss: 0.8852, batch_reg_loss: 0.1757, reg_loss: 0.1755 ||:  20%|#9        | 22/111 [00:15<01:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9288, LAS: 0.8748, UEM: 0.4971, LEM: 0.2717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2908, partial_loss/deprel_loss: 0.5508, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6746, loss: 0.8829, batch_reg_loss: 0.1758, reg_loss: 0.1756 ||:  23%|##2       | 25/111 [00:17<01:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9293, LAS: 0.8759, UEM: 0.5267, LEM: 0.2979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2407, partial_loss/deprel_loss: 0.4070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5496, loss: 0.8696, batch_reg_loss: 0.1758, reg_loss: 0.1756 ||:  25%|##5       | 28/111 [00:19<00:59,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8130, UAS: 0.9297, LAS: 0.8768, UEM: 0.5495, LEM: 0.3195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5913, partial_loss/deprel_loss: 1.1328, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4003, loss: 0.8653, batch_reg_loss: 0.1758, reg_loss: 0.1756 ||:  28%|##7       | 31/111 [00:21<00:58,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9309, LAS: 0.8782, UEM: 0.5469, LEM: 0.3167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7353, partial_loss/deprel_loss: 0.8071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9686, loss: 0.8547, batch_reg_loss: 0.1759, reg_loss: 0.1756 ||:  31%|###       | 34/111 [00:24<00:56,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9306, LAS: 0.8777, UEM: 0.5350, LEM: 0.3066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9533, partial_loss/deprel_loss: 0.8344, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0341, loss: 0.8590, batch_reg_loss: 0.1759, reg_loss: 0.1757 ||:  33%|###3      | 37/111 [00:26<00:54,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9295, LAS: 0.8769, UEM: 0.5536, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4604, partial_loss/deprel_loss: 0.5286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6909, loss: 0.8681, batch_reg_loss: 0.1760, reg_loss: 0.1757 ||:  36%|###6      | 40/111 [00:28<00:53,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9295, LAS: 0.8769, UEM: 0.5425, LEM: 0.3175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4519, partial_loss/deprel_loss: 0.5442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7018, loss: 0.8705, batch_reg_loss: 0.1760, reg_loss: 0.1757 ||:  39%|###8      | 43/111 [00:30<00:49,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8691, UAS: 0.9290, LAS: 0.8759, UEM: 0.5314, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6497, partial_loss/deprel_loss: 0.7674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9200, loss: 0.8797, batch_reg_loss: 0.1761, reg_loss: 0.1757 ||:  42%|####2     | 47/111 [00:33<00:44,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8567, UAS: 0.9299, LAS: 0.8766, UEM: 0.5275, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0313, partial_loss/deprel_loss: 0.9238, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1214, loss: 0.8750, batch_reg_loss: 0.1761, reg_loss: 0.1758 ||:  46%|####5     | 51/111 [00:35<00:40,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9301, LAS: 0.8769, UEM: 0.5190, LEM: 0.2921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5316, partial_loss/deprel_loss: 0.5359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7112, loss: 0.8718, batch_reg_loss: 0.1762, reg_loss: 0.1758 ||:  49%|####8     | 54/111 [00:38<00:39,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9306, LAS: 0.8773, UEM: 0.5160, LEM: 0.2865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5170, partial_loss/deprel_loss: 0.6902, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8318, loss: 0.8682, batch_reg_loss: 0.1762, reg_loss: 0.1758 ||:  52%|#####2    | 58/111 [00:40<00:35,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8467, UAS: 0.9301, LAS: 0.8768, UEM: 0.5379, LEM: 0.3110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9494, partial_loss/deprel_loss: 0.8664, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0593, loss: 0.8701, batch_reg_loss: 0.1763, reg_loss: 0.1758 ||:  56%|#####5    | 62/111 [00:43<00:35,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9310, LAS: 0.8777, UEM: 0.5382, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3715, partial_loss/deprel_loss: 0.5127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6608, loss: 0.8643, batch_reg_loss: 0.1763, reg_loss: 0.1759 ||:  59%|#####8    | 65/111 [00:45<00:32,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9318, LAS: 0.8785, UEM: 0.5475, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3592, partial_loss/deprel_loss: 0.5754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7085, loss: 0.8581, batch_reg_loss: 0.1764, reg_loss: 0.1759 ||:  61%|######1   | 68/111 [00:48<00:32,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9326, LAS: 0.8792, UEM: 0.5501, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4939, partial_loss/deprel_loss: 0.6939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8303, loss: 0.8533, batch_reg_loss: 0.1764, reg_loss: 0.1759 ||:  64%|######3   | 71/111 [00:50<00:29,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8675, UAS: 0.9329, LAS: 0.8796, UEM: 0.5458, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8771, partial_loss/deprel_loss: 0.8076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9980, loss: 0.8528, batch_reg_loss: 0.1764, reg_loss: 0.1759 ||:  68%|######7   | 75/111 [00:52<00:24,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8787, UAS: 0.9329, LAS: 0.8795, UEM: 0.5392, LEM: 0.3021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7339, partial_loss/deprel_loss: 0.8141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9745, loss: 0.8561, batch_reg_loss: 0.1765, reg_loss: 0.1760 ||:  70%|#######   | 78/111 [00:54<00:22,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8550, UAS: 0.9331, LAS: 0.8798, UEM: 0.5351, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9806, partial_loss/deprel_loss: 0.8367, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0420, loss: 0.8542, batch_reg_loss: 0.1765, reg_loss: 0.1760 ||:  74%|#######3  | 82/111 [00:57<00:19,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9331, LAS: 0.8796, UEM: 0.5288, LEM: 0.2907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9883, partial_loss/deprel_loss: 0.8582, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0608, loss: 0.8549, batch_reg_loss: 0.1766, reg_loss: 0.1760 ||:  77%|#######7  | 86/111 [00:59<00:16,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8371, UAS: 0.9325, LAS: 0.8789, UEM: 0.5258, LEM: 0.2895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1699, partial_loss/deprel_loss: 0.9620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1802, loss: 0.8598, batch_reg_loss: 0.1766, reg_loss: 0.1760 ||:  81%|########1 | 90/111 [01:02<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9327, LAS: 0.8790, UEM: 0.5229, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5761, partial_loss/deprel_loss: 0.7385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8827, loss: 0.8601, batch_reg_loss: 0.1767, reg_loss: 0.1761 ||:  85%|########4 | 94/111 [01:05<00:11,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9327, LAS: 0.8789, UEM: 0.5254, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2904, partial_loss/deprel_loss: 0.4370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5844, loss: 0.8596, batch_reg_loss: 0.1767, reg_loss: 0.1761 ||:  88%|########8 | 98/111 [01:08<00:09,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9322, LAS: 0.8783, UEM: 0.5222, LEM: 0.2851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8614, partial_loss/deprel_loss: 0.8358, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0177, loss: 0.8647, batch_reg_loss: 0.1768, reg_loss: 0.1761 ||:  92%|#########1| 102/111 [01:11<00:06,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8329, UAS: 0.9325, LAS: 0.8787, UEM: 0.5388, LEM: 0.3065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3338, partial_loss/deprel_loss: 0.9728, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2218, loss: 0.8622, batch_reg_loss: 0.1768, reg_loss: 0.1761 ||:  95%|#########4| 105/111 [01:13<00:04,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9322, LAS: 0.8784, UEM: 0.5361, LEM: 0.3039, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6211, partial_loss/deprel_loss: 0.6854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8494, loss: 0.8656, batch_reg_loss: 0.1769, reg_loss: 0.1762 ||:  98%|#########8| 109/111 [01:16<00:01,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8162, UAS: 0.9319, LAS: 0.8781, UEM: 0.5376, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5148, partial_loss/deprel_loss: 1.0411, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3128, loss: 0.8674, batch_reg_loss: 0.1769, reg_loss: 0.1762 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
+      "2023-04-07 00:11:10,307 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:11:10,307 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.041  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.515  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.176  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - UEM                      |     0.538  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - LAS                      |     0.878  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - loss                     |     0.867  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - LEM                      |     0.305  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - UAS                      |     0.932  |       N/A\n",
+      "2023-04-07 00:11:10,309 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:11:10,309 - INFO - combo.training.tensorboard_writer - EM                       |     0.816  |       N/A\n",
+      "2023-04-07 00:11:10,309 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:11:10,313 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:11:15,962 - INFO - combo.training.trainer - Epoch duration: 0:01:25.568982\n",
+      "2023-04-07 00:11:15,962 - INFO - combo.training.trainer - Estimated training time remaining: 7:24:11\n",
+      "2023-04-07 00:11:15,962 - INFO - allennlp.training.trainer - Epoch 62/399\n",
+      "2023-04-07 00:11:15,963 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:11:15,963 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:11:15,970 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9461, LAS: 0.8929, UEM: 0.6482, LEM: 0.3817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8178, partial_loss/deprel_loss: 0.7325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9265, loss: 0.7051, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:   3%|2         | 3/111 [00:02<01:19,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9367, LAS: 0.8823, UEM: 0.5942, LEM: 0.3705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6823, partial_loss/deprel_loss: 0.8525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9954, loss: 0.8175, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:   6%|6         | 7/111 [00:04<01:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7817, UAS: 0.9301, LAS: 0.8763, UEM: 0.5643, LEM: 0.3362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2934, partial_loss/deprel_loss: 1.3399, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7076, loss: 0.8878, batch_reg_loss: 0.1770, reg_loss: 0.1769 ||:   9%|9         | 10/111 [00:06<01:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9312, LAS: 0.8783, UEM: 0.5568, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2351, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.8788, batch_reg_loss: 0.1770, reg_loss: 0.1769 ||:  13%|#2        | 14/111 [00:09<01:05,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9361, LAS: 0.8829, UEM: 0.5695, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4688, partial_loss/deprel_loss: 0.5094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6782, loss: 0.8412, batch_reg_loss: 0.1770, reg_loss: 0.1769 ||:  15%|#5        | 17/111 [00:11<01:06,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9335, LAS: 0.8806, UEM: 0.5433, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0345, partial_loss/deprel_loss: 0.7780, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0062, loss: 0.8508, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||:  18%|#8        | 20/111 [00:13<01:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9343, LAS: 0.8818, UEM: 0.5205, LEM: 0.2839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6520, partial_loss/deprel_loss: 0.6173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8012, loss: 0.8428, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||:  22%|##1       | 24/111 [00:16<00:58,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9322, LAS: 0.8798, UEM: 0.4931, LEM: 0.2629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7861, partial_loss/deprel_loss: 0.7325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9202, loss: 0.8579, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||:  25%|##5       | 28/111 [00:18<00:55,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9330, LAS: 0.8811, UEM: 0.5272, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1210, partial_loss/deprel_loss: 0.2362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3901, loss: 0.8492, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||:  28%|##7       | 31/111 [00:21<00:56,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9329, LAS: 0.8809, UEM: 0.5126, LEM: 0.2930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5720, partial_loss/deprel_loss: 0.6731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8298, loss: 0.8500, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||:  31%|###       | 34/111 [00:23<00:54,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9333, LAS: 0.8813, UEM: 0.5162, LEM: 0.2939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5572, partial_loss/deprel_loss: 0.5714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7455, loss: 0.8451, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||:  33%|###3      | 37/111 [00:25<00:53,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9343, LAS: 0.8824, UEM: 0.5142, LEM: 0.2895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4571, partial_loss/deprel_loss: 0.6004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7487, loss: 0.8359, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||:  36%|###6      | 40/111 [00:27<00:52,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9351, LAS: 0.8832, UEM: 0.5291, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3019, partial_loss/deprel_loss: 0.4755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6177, loss: 0.8277, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||:  39%|###8      | 43/111 [00:30<00:50,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9371, LAS: 0.8861, UEM: 0.5756, LEM: 0.3583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2111, partial_loss/deprel_loss: 0.3450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4951, loss: 0.8072, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  41%|####1     | 46/111 [00:32<00:49,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8542, UAS: 0.9372, LAS: 0.8862, UEM: 0.5747, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0707, partial_loss/deprel_loss: 0.8576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0771, loss: 0.8040, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  44%|####4     | 49/111 [00:34<00:47,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9382, LAS: 0.8872, UEM: 0.5813, LEM: 0.3621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4093, partial_loss/deprel_loss: 0.4927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6529, loss: 0.7991, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  47%|####6     | 52/111 [00:36<00:43,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8502, UAS: 0.9379, LAS: 0.8868, UEM: 0.5728, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9311, partial_loss/deprel_loss: 0.9079, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0894, loss: 0.8040, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  50%|#####     | 56/111 [00:39<00:37,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9370, LAS: 0.8861, UEM: 0.5686, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2738, partial_loss/deprel_loss: 0.4237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5706, loss: 0.8109, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  53%|#####3    | 59/111 [00:41<00:36,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9375, LAS: 0.8867, UEM: 0.5667, LEM: 0.3447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4263, partial_loss/deprel_loss: 0.6020, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7437, loss: 0.8056, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  56%|#####5    | 62/111 [00:43<00:34,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9370, LAS: 0.8863, UEM: 0.5694, LEM: 0.3457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3908, partial_loss/deprel_loss: 0.5036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6579, loss: 0.8078, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  59%|#####8    | 65/111 [00:45<00:33,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9366, LAS: 0.8859, UEM: 0.5667, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2895, partial_loss/deprel_loss: 0.3820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5403, loss: 0.8122, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  61%|######1   | 68/111 [00:47<00:30,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9359, LAS: 0.8850, UEM: 0.5564, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8085, partial_loss/deprel_loss: 0.8201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9946, loss: 0.8185, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  65%|######4   | 72/111 [00:50<00:26,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8626, UAS: 0.9351, LAS: 0.8842, UEM: 0.5619, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0201, partial_loss/deprel_loss: 0.7898, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0127, loss: 0.8247, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  68%|######7   | 75/111 [00:52<00:25,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9361, LAS: 0.8853, UEM: 0.5672, LEM: 0.3431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3834, partial_loss/deprel_loss: 0.5284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6762, loss: 0.8170, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  70%|#######   | 78/111 [00:54<00:23,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9357, LAS: 0.8848, UEM: 0.5614, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2974, partial_loss/deprel_loss: 0.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5576, loss: 0.8223, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  74%|#######3  | 82/111 [00:57<00:20,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9364, LAS: 0.8856, UEM: 0.5646, LEM: 0.3391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3102, partial_loss/deprel_loss: 0.5018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.8165, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  77%|#######6  | 85/111 [00:59<00:17,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9356, LAS: 0.8847, UEM: 0.5610, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6688, partial_loss/deprel_loss: 0.6762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8515, loss: 0.8214, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  80%|########  | 89/111 [01:01<00:14,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9349, LAS: 0.8840, UEM: 0.5549, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9371, partial_loss/deprel_loss: 0.8498, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0440, loss: 0.8271, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  84%|########3 | 93/111 [01:04<00:11,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9349, LAS: 0.8841, UEM: 0.5478, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6846, partial_loss/deprel_loss: 0.6411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8266, loss: 0.8268, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  87%|########7 | 97/111 [01:06<00:08,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9355, LAS: 0.8848, UEM: 0.5496, LEM: 0.3244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3925, partial_loss/deprel_loss: 0.5808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7199, loss: 0.8227, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  91%|######### | 101/111 [01:09<00:06,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9350, LAS: 0.8839, UEM: 0.5418, LEM: 0.3178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5451, partial_loss/deprel_loss: 0.6392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7972, loss: 0.8280, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  95%|#########4| 105/111 [01:12<00:03,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9350, LAS: 0.8839, UEM: 0.5435, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7372, partial_loss/deprel_loss: 0.6851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8723, loss: 0.8279, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  98%|#########8| 109/111 [01:15<00:01,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9352, LAS: 0.8843, UEM: 0.5459, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2081, partial_loss/deprel_loss: 0.3644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5099, loss: 0.8251, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.364  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.208  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.177  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - UEM                      |     0.546  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - LAS                      |     0.884  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - loss                     |     0.825  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - LEM                      |     0.321  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - UAS                      |     0.935  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - EM                       |     0.926  |       N/A\n",
+      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:12:35,734 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:12:40,483 - INFO - combo.training.trainer - Epoch duration: 0:01:24.520495\n",
+      "2023-04-07 00:12:40,484 - INFO - combo.training.trainer - Estimated training time remaining: 7:23:22\n",
+      "2023-04-07 00:12:40,484 - INFO - allennlp.training.trainer - Epoch 63/399\n",
+      "2023-04-07 00:12:40,484 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:12:40,485 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:12:40,495 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9622, LAS: 0.9136, UEM: 0.7143, LEM: 0.3932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2952, partial_loss/deprel_loss: 0.4429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5901, loss: 0.5662, batch_reg_loss: 0.1767, reg_loss: 0.1768 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9647, LAS: 0.9167, UEM: 0.7773, LEM: 0.5015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1387, partial_loss/deprel_loss: 0.3915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5177, loss: 0.5657, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:   5%|5         | 6/111 [00:04<01:17,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9528, LAS: 0.9026, UEM: 0.7066, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2673, partial_loss/deprel_loss: 0.3965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5474, loss: 0.6629, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:   9%|9         | 10/111 [00:07<01:11,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8438, UAS: 0.9508, LAS: 0.8998, UEM: 0.6968, LEM: 0.4310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0591, partial_loss/deprel_loss: 0.9699, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1644, loss: 0.6890, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:  12%|#1        | 13/111 [00:09<01:10,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9486, LAS: 0.8977, UEM: 0.6604, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3376, partial_loss/deprel_loss: 0.4769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6258, loss: 0.7111, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:  15%|#5        | 17/111 [00:11<01:04,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9484, LAS: 0.8977, UEM: 0.6432, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2738, partial_loss/deprel_loss: 0.4217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5688, loss: 0.7174, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:  19%|#8        | 21/111 [00:14<01:01,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9471, LAS: 0.8968, UEM: 0.6249, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3350, partial_loss/deprel_loss: 0.4300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5877, loss: 0.7248, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:  22%|##1       | 24/111 [00:16<01:00,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9458, LAS: 0.8951, UEM: 0.6095, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3742, partial_loss/deprel_loss: 0.5653, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7037, loss: 0.7378, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:  24%|##4       | 27/111 [00:18<00:58,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9469, LAS: 0.8963, UEM: 0.6098, LEM: 0.3461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2797, partial_loss/deprel_loss: 0.5113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6416, loss: 0.7258, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  28%|##7       | 31/111 [00:21<00:54,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9419, LAS: 0.8912, UEM: 0.5994, LEM: 0.3402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3695, partial_loss/deprel_loss: 0.4635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6213, loss: 0.7673, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  31%|###       | 34/111 [00:23<00:54,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8787, UAS: 0.9405, LAS: 0.8897, UEM: 0.5848, LEM: 0.3277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7267, partial_loss/deprel_loss: 0.6768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8634, loss: 0.7788, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  33%|###3      | 37/111 [00:25<00:52,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9384, LAS: 0.8874, UEM: 0.5624, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9695, partial_loss/deprel_loss: 0.7204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9468, loss: 0.7958, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  37%|###6      | 41/111 [00:28<00:49,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9389, LAS: 0.8880, UEM: 0.5617, LEM: 0.3114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3551, partial_loss/deprel_loss: 0.4208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5843, loss: 0.7929, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  40%|###9      | 44/111 [00:30<00:48,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9394, LAS: 0.8883, UEM: 0.5660, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5540, partial_loss/deprel_loss: 0.6572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8132, loss: 0.7888, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  42%|####2     | 47/111 [00:33<00:47,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9408, LAS: 0.8902, UEM: 0.5851, LEM: 0.3367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4763, partial_loss/deprel_loss: 0.5986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7508, loss: 0.7764, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  45%|####5     | 50/111 [00:35<00:47,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9396, LAS: 0.8890, UEM: 0.5734, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9640, partial_loss/deprel_loss: 0.7751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9895, loss: 0.7859, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  48%|####7     | 53/111 [00:38<00:44,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9395, LAS: 0.8891, UEM: 0.5686, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4899, partial_loss/deprel_loss: 0.5436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7095, loss: 0.7854, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  50%|#####     | 56/111 [00:40<00:41,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9399, LAS: 0.8895, UEM: 0.5699, LEM: 0.3219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2513, partial_loss/deprel_loss: 0.4202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5631, loss: 0.7826, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  53%|#####3    | 59/111 [00:42<00:39,  1.30it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9391, LAS: 0.8886, UEM: 0.5616, LEM: 0.3157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4519, partial_loss/deprel_loss: 0.5807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7315, loss: 0.7914, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  56%|#####5    | 62/111 [00:44<00:36,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9392, LAS: 0.8885, UEM: 0.5575, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2907, partial_loss/deprel_loss: 0.5125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6448, loss: 0.7910, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  59%|#####9    | 66/111 [00:47<00:32,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9386, LAS: 0.8878, UEM: 0.5526, LEM: 0.3064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6683, partial_loss/deprel_loss: 0.7764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9313, loss: 0.7982, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  62%|######2   | 69/111 [00:49<00:29,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9385, LAS: 0.8875, UEM: 0.5494, LEM: 0.3030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.5013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6389, loss: 0.8003, batch_reg_loss: 0.1766, reg_loss: 0.1766 ||:  65%|######4   | 72/111 [00:51<00:28,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9390, LAS: 0.8885, UEM: 0.5791, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1575, partial_loss/deprel_loss: 0.2822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4339, loss: 0.7948, batch_reg_loss: 0.1766, reg_loss: 0.1766 ||:  68%|######7   | 75/111 [00:54<00:27,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9369, LAS: 0.8863, UEM: 0.5684, LEM: 0.3360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7013, partial_loss/deprel_loss: 0.9147, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2486, loss: 0.8097, batch_reg_loss: 0.1766, reg_loss: 0.1766 ||:  71%|#######1  | 79/111 [00:56<00:23,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9371, LAS: 0.8866, UEM: 0.5699, LEM: 0.3353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2117, partial_loss/deprel_loss: 0.3626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5090, loss: 0.8084, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  75%|#######4  | 83/111 [00:59<00:19,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9383, LAS: 0.8878, UEM: 0.5797, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1914, partial_loss/deprel_loss: 0.3426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4889, loss: 0.7984, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  78%|#######8  | 87/111 [01:02<00:16,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9379, LAS: 0.8874, UEM: 0.5752, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3438, partial_loss/deprel_loss: 0.4141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5766, loss: 0.8011, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  82%|########1 | 91/111 [01:04<00:13,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9383, LAS: 0.8878, UEM: 0.5733, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3745, partial_loss/deprel_loss: 0.4885, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6422, loss: 0.7969, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  85%|########4 | 94/111 [01:06<00:11,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9383, LAS: 0.8879, UEM: 0.5673, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7117, partial_loss/deprel_loss: 0.7441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9141, loss: 0.7961, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  88%|########8 | 98/111 [01:09<00:08,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9386, LAS: 0.8882, UEM: 0.5673, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.3630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.7950, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  92%|#########1| 102/111 [01:12<00:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9391, LAS: 0.8888, UEM: 0.5696, LEM: 0.3285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2042, partial_loss/deprel_loss: 0.3583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5040, loss: 0.7909, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  95%|#########4| 105/111 [01:14<00:04,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8744, UAS: 0.9389, LAS: 0.8884, UEM: 0.5633, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7002, partial_loss/deprel_loss: 0.7096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8842, loss: 0.7945, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  98%|#########8| 109/111 [01:16<00:01,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8158, UAS: 0.9386, LAS: 0.8880, UEM: 0.5631, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5034, partial_loss/deprel_loss: 1.0496, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3169, loss: 0.7973, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
+      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.050  |       N/A\n",
+      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.503  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.177  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - UEM                      |     0.563  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - LAS                      |     0.888  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - loss                     |     0.797  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - LEM                      |     0.323  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - UAS                      |     0.939  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - EM                       |     0.816  |       N/A\n",
+      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:14:00,976 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:14:07,569 - INFO - combo.training.trainer - Epoch duration: 0:01:27.085147\n",
+      "2023-04-07 00:14:07,569 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:46\n",
+      "2023-04-07 00:14:07,570 - INFO - allennlp.training.trainer - Epoch 64/399\n",
+      "2023-04-07 00:14:07,570 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:14:07,570 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:14:07,579 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9424, LAS: 0.8965, UEM: 0.7553, LEM: 0.5743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4184, partial_loss/deprel_loss: 0.5698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7159, loss: 0.7365, batch_reg_loss: 0.1765, reg_loss: 0.1765 ||:   3%|2         | 3/111 [00:02<01:20,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9456, LAS: 0.8991, UEM: 0.6562, LEM: 0.4308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4812, partial_loss/deprel_loss: 0.5967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7501, loss: 0.7251, batch_reg_loss: 0.1764, reg_loss: 0.1765 ||:   6%|6         | 7/111 [00:04<01:13,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9400, LAS: 0.8915, UEM: 0.5800, LEM: 0.3541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4154, partial_loss/deprel_loss: 0.5672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7133, loss: 0.7932, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  10%|9         | 11/111 [00:07<01:10,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9398, LAS: 0.8908, UEM: 0.5572, LEM: 0.3242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3106, partial_loss/deprel_loss: 0.4770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6202, loss: 0.7940, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  13%|#2        | 14/111 [00:09<01:08,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9379, LAS: 0.8888, UEM: 0.5385, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5457, partial_loss/deprel_loss: 0.6542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8089, loss: 0.8111, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  15%|#5        | 17/111 [00:11<01:07,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9404, LAS: 0.8915, UEM: 0.5680, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2816, partial_loss/deprel_loss: 0.4403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 0.7857, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  18%|#8        | 20/111 [00:14<01:05,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7952, UAS: 0.9377, LAS: 0.8885, UEM: 0.5705, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2371, partial_loss/deprel_loss: 1.3617, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7132, loss: 0.8161, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  21%|##        | 23/111 [00:16<01:04,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9395, LAS: 0.8902, UEM: 0.5696, LEM: 0.3252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4209, partial_loss/deprel_loss: 0.4874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6505, loss: 0.8001, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9428, LAS: 0.8938, UEM: 0.6109, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2672, partial_loss/deprel_loss: 0.4811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.7724, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  26%|##6       | 29/111 [00:20<00:58,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9427, LAS: 0.8934, UEM: 0.6043, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8892, partial_loss/deprel_loss: 0.7627, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9644, loss: 0.7738, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  29%|##8       | 32/111 [00:22<00:55,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9429, LAS: 0.8938, UEM: 0.5867, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4316, partial_loss/deprel_loss: 0.5089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6698, loss: 0.7712, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  32%|###2      | 36/111 [00:25<00:51,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9414, LAS: 0.8917, UEM: 0.5679, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9932, partial_loss/deprel_loss: 0.8972, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0928, loss: 0.7831, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  36%|###6      | 40/111 [00:27<00:46,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9402, LAS: 0.8901, UEM: 0.5609, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4805, partial_loss/deprel_loss: 1.1199, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3684, loss: 0.7962, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  40%|###9      | 44/111 [00:30<00:43,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9421, LAS: 0.8927, UEM: 0.5967, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2505, partial_loss/deprel_loss: 0.4069, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5520, loss: 0.7783, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  43%|####3     | 48/111 [00:33<00:44,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9430, LAS: 0.8937, UEM: 0.5972, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2783, partial_loss/deprel_loss: 0.5068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6374, loss: 0.7690, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  47%|####6     | 52/111 [00:36<00:41,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8687, UAS: 0.9428, LAS: 0.8935, UEM: 0.5909, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7752, partial_loss/deprel_loss: 0.7210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9082, loss: 0.7704, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  50%|#####     | 56/111 [00:38<00:37,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9439, LAS: 0.8947, UEM: 0.6005, LEM: 0.3591, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4300, partial_loss/deprel_loss: 0.4863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6514, loss: 0.7624, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  53%|#####3    | 59/111 [00:40<00:36,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8199, UAS: 0.9417, LAS: 0.8926, UEM: 0.5902, LEM: 0.3526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6636, partial_loss/deprel_loss: 0.9961, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3059, loss: 0.7789, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  56%|#####5    | 62/111 [00:42<00:33,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9413, LAS: 0.8921, UEM: 0.5894, LEM: 0.3530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0166, partial_loss/deprel_loss: 0.8454, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0559, loss: 0.7818, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  59%|#####8    | 65/111 [00:45<00:32,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9409, LAS: 0.8915, UEM: 0.5879, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2982, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5866, loss: 0.7857, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  61%|######1   | 68/111 [00:47<00:30,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9415, LAS: 0.8921, UEM: 0.5966, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7684, partial_loss/deprel_loss: 0.6968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8874, loss: 0.7806, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  64%|######3   | 71/111 [00:49<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9415, LAS: 0.8920, UEM: 0.5889, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3207, partial_loss/deprel_loss: 0.4941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6357, loss: 0.7809, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  68%|######7   | 75/111 [00:52<00:25,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8619, UAS: 0.9410, LAS: 0.8913, UEM: 0.5785, LEM: 0.3428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9618, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0183, loss: 0.7868, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  71%|#######1  | 79/111 [00:54<00:20,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9413, LAS: 0.8918, UEM: 0.5854, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9237, partial_loss/deprel_loss: 0.8028, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0032, loss: 0.7828, batch_reg_loss: 0.1762, reg_loss: 0.1764 ||:  75%|#######4  | 83/111 [00:57<00:18,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9416, LAS: 0.8921, UEM: 0.5822, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3736, partial_loss/deprel_loss: 0.5020, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6526, loss: 0.7811, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  78%|#######8  | 87/111 [01:00<00:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9419, LAS: 0.8924, UEM: 0.5824, LEM: 0.3462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2289, partial_loss/deprel_loss: 0.3876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5321, loss: 0.7777, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  81%|########1 | 90/111 [01:02<00:15,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9424, LAS: 0.8931, UEM: 0.5877, LEM: 0.3496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3492, partial_loss/deprel_loss: 0.5226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6642, loss: 0.7721, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  84%|########3 | 93/111 [01:04<00:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9426, LAS: 0.8934, UEM: 0.5861, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3260, partial_loss/deprel_loss: 0.4986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.7709, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  87%|########7 | 97/111 [01:07<00:09,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8197, UAS: 0.9416, LAS: 0.8925, UEM: 0.5812, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8202, partial_loss/deprel_loss: 0.9301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2843, loss: 0.7767, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  91%|######### | 101/111 [01:09<00:06,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9417, LAS: 0.8925, UEM: 0.5748, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5971, partial_loss/deprel_loss: 0.7558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9002, loss: 0.7791, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  95%|#########4| 105/111 [01:12<00:04,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.9416, LAS: 0.8923, UEM: 0.5710, LEM: 0.3332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7785, partial_loss/deprel_loss: 0.7124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9018, loss: 0.7798, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  97%|#########7| 108/111 [01:14<00:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9410, LAS: 0.8915, UEM: 0.5651, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9154, partial_loss/deprel_loss: 0.8018, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0006, loss: 0.7854, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 100%|##########| 111/111 [01:16<00:00,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9410, LAS: 0.8915, UEM: 0.5651, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9154, partial_loss/deprel_loss: 0.8018, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0006, loss: 0.7854, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.802  |       N/A\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.915  |       N/A\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.176  |       N/A\n",
+      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - UEM                      |     0.565  |       N/A\n",
+      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - LAS                      |     0.892  |       N/A\n",
+      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - loss                     |     0.785  |       N/A\n",
+      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - LEM                      |     0.329  |       N/A\n",
+      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |       N/A\n",
+      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - EM                       |     0.855  |       N/A\n",
+      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:15:27,598 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:15:34,868 - INFO - combo.training.trainer - Epoch duration: 0:01:27.298867\n",
+      "2023-04-07 00:15:34,869 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:09\n",
+      "2023-04-07 00:15:34,869 - INFO - allennlp.training.trainer - Epoch 65/399\n",
+      "2023-04-07 00:15:34,869 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:15:34,869 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:15:34,876 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9188, UAS: 0.9502, LAS: 0.9006, UEM: 0.4792, LEM: 0.2152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3437, partial_loss/deprel_loss: 0.4806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6294, loss: 0.7186, batch_reg_loss: 0.1762, reg_loss: 0.1762 ||:   3%|2         | 3/111 [00:02<01:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9285, LAS: 0.8794, UEM: 0.3964, LEM: 0.1731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6617, partial_loss/deprel_loss: 0.5697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7642, loss: 0.8714, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:   5%|5         | 6/111 [00:04<01:15,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9329, LAS: 0.8837, UEM: 0.4081, LEM: 0.1828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5837, partial_loss/deprel_loss: 0.6297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7967, loss: 0.8328, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:   8%|8         | 9/111 [00:06<01:13,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.9340, LAS: 0.8848, UEM: 0.4359, LEM: 0.2012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1888, partial_loss/deprel_loss: 0.8942, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1292, loss: 0.8237, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  12%|#1        | 13/111 [00:09<01:08,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9390, LAS: 0.8905, UEM: 0.5050, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2596, partial_loss/deprel_loss: 0.3912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5410, loss: 0.7799, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  14%|#4        | 16/111 [00:11<01:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9417, LAS: 0.8939, UEM: 0.5398, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4567, partial_loss/deprel_loss: 0.5314, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6926, loss: 0.7536, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  17%|#7        | 19/111 [00:13<01:06,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9426, LAS: 0.8944, UEM: 0.5453, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5512, partial_loss/deprel_loss: 0.5817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7518, loss: 0.7517, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  20%|#9        | 22/111 [00:15<01:03,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8684, UAS: 0.9405, LAS: 0.8917, UEM: 0.5186, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9198, partial_loss/deprel_loss: 0.7851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9881, loss: 0.7773, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  23%|##2       | 25/111 [00:17<01:00,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9414, LAS: 0.8929, UEM: 0.5435, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3073, partial_loss/deprel_loss: 0.4587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6046, loss: 0.7677, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  25%|##5       | 28/111 [00:19<00:57,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9427, LAS: 0.8947, UEM: 0.5851, LEM: 0.3425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0904, partial_loss/deprel_loss: 0.2188, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3692, loss: 0.7532, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  28%|##7       | 31/111 [00:22<00:58,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9421, LAS: 0.8936, UEM: 0.5740, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7529, partial_loss/deprel_loss: 0.8034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9694, loss: 0.7675, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  31%|###       | 34/111 [00:24<00:54,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9422, LAS: 0.8932, UEM: 0.5649, LEM: 0.3197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5704, partial_loss/deprel_loss: 0.6786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8331, loss: 0.7708, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  33%|###3      | 37/111 [00:26<00:52,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9389, LAS: 0.8896, UEM: 0.5482, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9369, partial_loss/deprel_loss: 0.8963, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0805, loss: 0.7991, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  36%|###6      | 40/111 [00:28<00:51,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9398, LAS: 0.8907, UEM: 0.5574, LEM: 0.3179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2348, partial_loss/deprel_loss: 0.3746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5227, loss: 0.7898, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  39%|###8      | 43/111 [00:30<00:49,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9402, LAS: 0.8911, UEM: 0.5758, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0961, partial_loss/deprel_loss: 0.3030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4377, loss: 0.7841, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  41%|####1     | 46/111 [00:33<00:48,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9412, LAS: 0.8924, UEM: 0.5791, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3451, partial_loss/deprel_loss: 0.4574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.7733, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  44%|####4     | 49/111 [00:35<00:48,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9405, LAS: 0.8913, UEM: 0.5642, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9953, partial_loss/deprel_loss: 0.8299, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0390, loss: 0.7814, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  48%|####7     | 53/111 [00:38<00:42,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9404, LAS: 0.8914, UEM: 0.5579, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3034, partial_loss/deprel_loss: 0.4683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6113, loss: 0.7792, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  51%|#####1    | 57/111 [00:40<00:37,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9410, LAS: 0.8922, UEM: 0.5655, LEM: 0.3256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4643, partial_loss/deprel_loss: 0.6052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7531, loss: 0.7743, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  54%|#####4    | 60/111 [00:42<00:36,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9420, LAS: 0.8935, UEM: 0.5793, LEM: 0.3406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4151, partial_loss/deprel_loss: 0.4695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6346, loss: 0.7633, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  57%|#####6    | 63/111 [00:45<00:35,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9420, LAS: 0.8940, UEM: 0.6043, LEM: 0.3750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0402, partial_loss/deprel_loss: 0.1250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2840, loss: 0.7604, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  59%|#####9    | 66/111 [00:47<00:34,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9424, LAS: 0.8945, UEM: 0.6072, LEM: 0.3778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8798, partial_loss/deprel_loss: 0.7190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9271, loss: 0.7567, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  62%|######2   | 69/111 [00:50<00:32,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8730, UAS: 0.9417, LAS: 0.8937, UEM: 0.5964, LEM: 0.3689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9134, partial_loss/deprel_loss: 0.6988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9177, loss: 0.7623, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  66%|######5   | 73/111 [00:52<00:27,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9425, LAS: 0.8946, UEM: 0.6038, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8754, partial_loss/deprel_loss: 0.7352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9392, loss: 0.7569, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  69%|######9   | 77/111 [00:57<00:30,  1.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9430, LAS: 0.8949, UEM: 0.6048, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2401, partial_loss/deprel_loss: 0.4459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5807, loss: 0.7545, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  72%|#######2  | 80/111 [01:00<00:26,  1.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8322, UAS: 0.9423, LAS: 0.8940, UEM: 0.6014, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3299, partial_loss/deprel_loss: 1.0192, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2573, loss: 0.7618, batch_reg_loss: 0.1759, reg_loss: 0.1761 ||:  75%|#######4  | 83/111 [01:02<00:22,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9428, LAS: 0.8945, UEM: 0.6022, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8188, partial_loss/deprel_loss: 0.7814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9648, loss: 0.7589, batch_reg_loss: 0.1759, reg_loss: 0.1761 ||:  78%|#######8  | 87/111 [01:04<00:18,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9432, LAS: 0.8950, UEM: 0.6033, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4792, partial_loss/deprel_loss: 0.5202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.7550, batch_reg_loss: 0.1759, reg_loss: 0.1761 ||:  81%|########1 | 90/111 [01:06<00:15,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8641, UAS: 0.9432, LAS: 0.8948, UEM: 0.5973, LEM: 0.3630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7809, partial_loss/deprel_loss: 0.8364, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0012, loss: 0.7570, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||:  85%|########4 | 94/111 [01:09<00:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8751, UAS: 0.9430, LAS: 0.8947, UEM: 0.5933, LEM: 0.3590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0805, partial_loss/deprel_loss: 0.7475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9900, loss: 0.7587, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||:  87%|########7 | 97/111 [01:11<00:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9429, LAS: 0.8944, UEM: 0.5915, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6612, partial_loss/deprel_loss: 0.7524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9101, loss: 0.7615, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||:  91%|######### | 101/111 [01:14<00:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8512, UAS: 0.9425, LAS: 0.8939, UEM: 0.5845, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2449, partial_loss/deprel_loss: 0.8082, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0714, loss: 0.7650, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||:  95%|#########4| 105/111 [01:16<00:03,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9423, LAS: 0.8940, UEM: 0.5795, LEM: 0.3461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3786, partial_loss/deprel_loss: 0.4375, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6016, loss: 0.7645, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||:  98%|#########8| 109/111 [01:18<00:01,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9422, LAS: 0.8938, UEM: 0.5751, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6651, partial_loss/deprel_loss: 0.6879, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8592, loss: 0.7658, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||: 100%|##########| 111/111 [01:20<00:00,  1.39it/s]\n",
+      "2023-04-07 00:16:58,127 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9622, LAS: 0.9118, UEM: 0.7073, LEM: 0.3706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5903, partial_loss/deprel_loss: 24.2431, partial_loss/cycle_loss: 0.0000, batch_loss: 19.5125, loss: 18.2181, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9523, LAS: 0.9049, UEM: 0.7137, LEM: 0.4660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2693, partial_loss/deprel_loss: 48.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 38.9773, loss: 22.4714, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9472, LAS: 0.8970, UEM: 0.6454, LEM: 0.3894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1023, partial_loss/deprel_loss: 43.3819, partial_loss/cycle_loss: 0.0000, batch_loss: 34.9260, loss: 24.5970, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.02it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9499, LAS: 0.8993, UEM: 0.6645, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4265, partial_loss/deprel_loss: 24.5629, partial_loss/cycle_loss: 0.0000, batch_loss: 19.7356, loss: 24.1319, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8269, UAS: 0.9448, LAS: 0.8937, UEM: 0.6475, LEM: 0.3805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6012, partial_loss/deprel_loss: 57.6302, partial_loss/cycle_loss: 0.0000, batch_loss: 46.4244, loss: 25.8467, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.01it/s]\n",
+      "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.688  |    57.630\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.665  |     1.601\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.176  |     0.000\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - UEM                      |     0.575  |     0.648\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - LAS                      |     0.894  |     0.894\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - loss                     |     0.766  |    25.847\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - LEM                      |     0.343  |     0.381\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - UAS                      |     0.942  |     0.945\n",
+      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:17:10,954 - INFO - combo.training.tensorboard_writer - EM                       |     0.883  |     0.827\n",
+      "2023-04-07 00:17:10,954 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:17:10,958 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:17:15,921 - INFO - combo.training.trainer - Epoch duration: 0:01:41.052355\n",
+      "2023-04-07 00:17:15,922 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:41\n",
+      "2023-04-07 00:17:15,928 - INFO - allennlp.training.trainer - Epoch 66/399\n",
+      "2023-04-07 00:17:15,930 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:17:15,930 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:17:15,938 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9503, LAS: 0.9045, UEM: 0.6977, LEM: 0.5070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1065, partial_loss/deprel_loss: 0.2698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4130, loss: 0.6921, batch_reg_loss: 0.1759, reg_loss: 0.1759 ||:   3%|2         | 3/111 [00:02<01:20,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8694, UAS: 0.9330, LAS: 0.8820, UEM: 0.5288, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8724, partial_loss/deprel_loss: 0.7974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9882, loss: 0.8708, batch_reg_loss: 0.1759, reg_loss: 0.1759 ||:   6%|6         | 7/111 [00:04<01:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9319, LAS: 0.8828, UEM: 0.4824, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5042, partial_loss/deprel_loss: 0.6965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8339, loss: 0.8558, batch_reg_loss: 0.1758, reg_loss: 0.1759 ||:  10%|9         | 11/111 [00:07<01:08,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9382, LAS: 0.8904, UEM: 0.5645, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2334, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4984, loss: 0.7947, batch_reg_loss: 0.1758, reg_loss: 0.1759 ||:  13%|#2        | 14/111 [00:09<01:08,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8779, UAS: 0.9392, LAS: 0.8913, UEM: 0.5810, LEM: 0.3711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7095, partial_loss/deprel_loss: 0.7485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9165, loss: 0.7856, batch_reg_loss: 0.1758, reg_loss: 0.1759 ||:  15%|#5        | 17/111 [00:11<01:06,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9393, LAS: 0.8918, UEM: 0.5778, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2544, partial_loss/deprel_loss: 0.3554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5111, loss: 0.7788, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  18%|#8        | 20/111 [00:13<01:06,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9420, LAS: 0.8949, UEM: 0.5900, LEM: 0.3719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2620, partial_loss/deprel_loss: 0.4336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5751, loss: 0.7566, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  21%|##        | 23/111 [00:16<01:04,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9413, LAS: 0.8942, UEM: 0.5750, LEM: 0.3566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0092, partial_loss/deprel_loss: 0.7582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9842, loss: 0.7636, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  23%|##3       | 26/111 [00:18<01:02,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9425, LAS: 0.8950, UEM: 0.5722, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6922, partial_loss/deprel_loss: 0.7588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9213, loss: 0.7595, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  26%|##6       | 29/111 [00:20<00:58,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9426, LAS: 0.8947, UEM: 0.5539, LEM: 0.3315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5699, partial_loss/deprel_loss: 0.6186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7846, loss: 0.7658, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  30%|##9       | 33/111 [00:22<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9409, LAS: 0.8928, UEM: 0.5364, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2077, partial_loss/deprel_loss: 0.7697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0331, loss: 0.7801, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  32%|###2      | 36/111 [00:25<00:53,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9417, LAS: 0.8936, UEM: 0.5383, LEM: 0.3137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6008, partial_loss/deprel_loss: 0.6349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8038, loss: 0.7737, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  35%|###5      | 39/111 [00:27<00:50,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9419, LAS: 0.8937, UEM: 0.5330, LEM: 0.3057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7104, partial_loss/deprel_loss: 0.6737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8568, loss: 0.7698, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  39%|###8      | 43/111 [00:30<00:47,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9435, LAS: 0.8958, UEM: 0.5762, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4251, partial_loss/deprel_loss: 0.5221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6784, loss: 0.7536, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  41%|####1     | 46/111 [00:32<00:49,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9450, LAS: 0.8975, UEM: 0.6032, LEM: 0.3863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1083, partial_loss/deprel_loss: 0.2278, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3797, loss: 0.7388, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  44%|####4     | 49/111 [00:35<00:50,  1.22it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9446, LAS: 0.8970, UEM: 0.5923, LEM: 0.3751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5940, partial_loss/deprel_loss: 0.6613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8236, loss: 0.7427, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  47%|####6     | 52/111 [00:37<00:46,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8753, UAS: 0.9449, LAS: 0.8972, UEM: 0.5905, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9129, partial_loss/deprel_loss: 0.7567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9636, loss: 0.7413, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  50%|#####     | 56/111 [00:40<00:40,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9460, LAS: 0.8985, UEM: 0.6008, LEM: 0.3761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2598, partial_loss/deprel_loss: 0.4018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5491, loss: 0.7311, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  53%|#####3    | 59/111 [00:42<00:38,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8576, UAS: 0.9449, LAS: 0.8970, UEM: 0.5994, LEM: 0.3741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9877, partial_loss/deprel_loss: 0.8369, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0427, loss: 0.7406, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  56%|#####5    | 62/111 [00:44<00:36,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8152, UAS: 0.9420, LAS: 0.8940, UEM: 0.5910, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7323, partial_loss/deprel_loss: 0.9653, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2944, loss: 0.7644, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  59%|#####8    | 65/111 [00:46<00:33,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9423, LAS: 0.8944, UEM: 0.5933, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1783, partial_loss/deprel_loss: 0.3056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4558, loss: 0.7605, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  61%|######1   | 68/111 [00:49<00:31,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9416, LAS: 0.8937, UEM: 0.5844, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5059, partial_loss/deprel_loss: 0.5656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7293, loss: 0.7655, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  65%|######4   | 72/111 [00:51<00:27,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9416, LAS: 0.8939, UEM: 0.5826, LEM: 0.3602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8336, partial_loss/deprel_loss: 0.6601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8705, loss: 0.7631, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  68%|######7   | 75/111 [00:53<00:25,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9426, LAS: 0.8951, UEM: 0.5931, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2431, partial_loss/deprel_loss: 0.3982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5429, loss: 0.7539, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  70%|#######   | 78/111 [00:56<00:24,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9429, LAS: 0.8955, UEM: 0.5893, LEM: 0.3641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6002, partial_loss/deprel_loss: 0.7296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8794, loss: 0.7525, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  74%|#######3  | 82/111 [00:58<00:20,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9429, LAS: 0.8955, UEM: 0.5864, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3258, partial_loss/deprel_loss: 0.4505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.7537, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||:  77%|#######6  | 85/111 [01:00<00:18,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9425, LAS: 0.8951, UEM: 0.5812, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7507, partial_loss/deprel_loss: 0.7151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8979, loss: 0.7580, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||:  79%|#######9  | 88/111 [01:02<00:16,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9421, LAS: 0.8945, UEM: 0.5720, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5785, partial_loss/deprel_loss: 0.6467, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8087, loss: 0.7620, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||:  83%|########2 | 92/111 [01:05<00:13,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9420, LAS: 0.8944, UEM: 0.5703, LEM: 0.3458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2231, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5773, loss: 0.7642, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||:  86%|########5 | 95/111 [01:07<00:11,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9420, LAS: 0.8944, UEM: 0.5656, LEM: 0.3414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3783, partial_loss/deprel_loss: 0.4944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6468, loss: 0.7654, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||:  88%|########8 | 98/111 [01:09<00:09,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9425, LAS: 0.8950, UEM: 0.5688, LEM: 0.3418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2546, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5528, loss: 0.7615, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||:  91%|######### | 101/111 [01:12<00:07,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8398, UAS: 0.9421, LAS: 0.8945, UEM: 0.5678, LEM: 0.3398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2186, partial_loss/deprel_loss: 0.9452, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1755, loss: 0.7646, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||:  95%|#########4| 105/111 [01:14<00:04,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8529, UAS: 0.9422, LAS: 0.8945, UEM: 0.5710, LEM: 0.3428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1337, partial_loss/deprel_loss: 0.8690, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0975, loss: 0.7643, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||:  97%|#########7| 108/111 [01:16<00:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9424, LAS: 0.8947, UEM: 0.5696, LEM: 0.3410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4207, partial_loss/deprel_loss: 0.5379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6900, loss: 0.7623, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||: 100%|##########| 111/111 [01:18<00:00,  1.41it/s]\n",
+      "2023-04-07 00:18:37,817 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.538  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.421  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.176  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - UEM                      |     0.570  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - LAS                      |     0.895  |       N/A\n",
+      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - loss                     |     0.762  |       N/A\n",
+      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - LEM                      |     0.341  |       N/A\n",
+      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - UAS                      |     0.942  |       N/A\n",
+      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - EM                       |     0.905  |       N/A\n",
+      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:18:37,824 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:18:43,756 - INFO - combo.training.trainer - Epoch duration: 0:01:27.828285\n",
+      "2023-04-07 00:18:43,756 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:02\n",
+      "2023-04-07 00:18:43,756 - INFO - allennlp.training.trainer - Epoch 67/399\n",
+      "2023-04-07 00:18:43,756 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:18:43,757 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:18:43,764 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9642, LAS: 0.9136, UEM: 0.7103, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4133, partial_loss/deprel_loss: 0.5074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6642, loss: 0.5930, batch_reg_loss: 0.1756, reg_loss: 0.1756 ||:   3%|2         | 3/111 [00:02<01:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9569, LAS: 0.9091, UEM: 0.6867, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8104, partial_loss/deprel_loss: 0.7143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9091, loss: 0.6318, batch_reg_loss: 0.1756, reg_loss: 0.1756 ||:   5%|5         | 6/111 [00:04<01:15,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9488, LAS: 0.9010, UEM: 0.6200, LEM: 0.3721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8166, partial_loss/deprel_loss: 0.7593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9463, loss: 0.6963, batch_reg_loss: 0.1756, reg_loss: 0.1756 ||:   8%|8         | 9/111 [00:06<01:11,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9508, LAS: 0.9041, UEM: 0.6444, LEM: 0.3996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5798, partial_loss/deprel_loss: 0.5682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7461, loss: 0.6720, batch_reg_loss: 0.1755, reg_loss: 0.1756 ||:  11%|#         | 12/111 [00:08<01:12,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9467, LAS: 0.8998, UEM: 0.6254, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4919, partial_loss/deprel_loss: 0.8657, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1665, loss: 0.7057, batch_reg_loss: 0.1755, reg_loss: 0.1756 ||:  14%|#3        | 15/111 [00:10<01:10,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9469, LAS: 0.8998, UEM: 0.6047, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5035, partial_loss/deprel_loss: 0.5987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7551, loss: 0.7078, batch_reg_loss: 0.1755, reg_loss: 0.1756 ||:  16%|#6        | 18/111 [00:12<01:06,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9442, LAS: 0.8963, UEM: 0.5739, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7310, partial_loss/deprel_loss: 0.7217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8991, loss: 0.7291, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  20%|#9        | 22/111 [00:15<01:01,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9430, LAS: 0.8945, UEM: 0.5612, LEM: 0.3196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3415, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6500, loss: 0.7442, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  23%|##3       | 26/111 [00:18<00:57,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9418, LAS: 0.8931, UEM: 0.5430, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8382, partial_loss/deprel_loss: 0.7788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9661, loss: 0.7568, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  26%|##6       | 29/111 [00:20<00:56,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9410, LAS: 0.8926, UEM: 0.5419, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1855, partial_loss/deprel_loss: 0.3591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4999, loss: 0.7624, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  29%|##8       | 32/111 [00:22<00:54,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9414, LAS: 0.8931, UEM: 0.5294, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 0.4967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.7629, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  32%|###2      | 36/111 [00:24<00:50,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9408, LAS: 0.8920, UEM: 0.5319, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2387, partial_loss/deprel_loss: 0.4094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5507, loss: 0.7721, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  35%|###5      | 39/111 [00:27<00:50,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9387, LAS: 0.8896, UEM: 0.5138, LEM: 0.2844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7333, partial_loss/deprel_loss: 0.7696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9378, loss: 0.7934, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  39%|###8      | 43/111 [00:29<00:46,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9402, LAS: 0.8909, UEM: 0.5172, LEM: 0.2789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4004, partial_loss/deprel_loss: 0.5476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6936, loss: 0.7838, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  42%|####2     | 47/111 [00:32<00:41,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9420, LAS: 0.8928, UEM: 0.5398, LEM: 0.2949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2967, partial_loss/deprel_loss: 0.4850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6228, loss: 0.7686, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  46%|####5     | 51/111 [00:34<00:40,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8131, UAS: 0.9405, LAS: 0.8912, UEM: 0.5303, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9220, partial_loss/deprel_loss: 1.1761, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5007, loss: 0.7840, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  49%|####8     | 54/111 [00:37<00:38,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9656, UAS: 0.9420, LAS: 0.8931, UEM: 0.5650, LEM: 0.3310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0461, partial_loss/deprel_loss: 0.1304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2890, loss: 0.7724, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  51%|#####1    | 57/111 [00:39<00:40,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9416, LAS: 0.8928, UEM: 0.5562, LEM: 0.3234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6266, partial_loss/deprel_loss: 0.6746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8405, loss: 0.7761, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  55%|#####4    | 61/111 [00:42<00:35,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.9413, LAS: 0.8928, UEM: 0.5574, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8080, partial_loss/deprel_loss: 0.7247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9168, loss: 0.7787, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  58%|#####7    | 64/111 [00:44<00:33,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9412, LAS: 0.8928, UEM: 0.5553, LEM: 0.3234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2988, partial_loss/deprel_loss: 0.4409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5880, loss: 0.7789, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  61%|######1   | 68/111 [00:46<00:29,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9407, LAS: 0.8924, UEM: 0.5512, LEM: 0.3204, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4814, partial_loss/deprel_loss: 0.5985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7505, loss: 0.7839, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  65%|######4   | 72/111 [00:49<00:26,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9412, LAS: 0.8931, UEM: 0.5510, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2814, partial_loss/deprel_loss: 0.3595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5193, loss: 0.7792, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  68%|######8   | 76/111 [00:51<00:22,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9425, LAS: 0.8948, UEM: 0.5767, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1161, partial_loss/deprel_loss: 0.2586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4055, loss: 0.7664, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  72%|#######2  | 80/111 [00:54<00:21,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8449, UAS: 0.9419, LAS: 0.8942, UEM: 0.5766, LEM: 0.3485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3649, partial_loss/deprel_loss: 0.9268, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1898, loss: 0.7712, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  76%|#######5  | 84/111 [00:57<00:18,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9419, LAS: 0.8943, UEM: 0.5731, LEM: 0.3455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8962, partial_loss/deprel_loss: 0.7475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9527, loss: 0.7723, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  79%|#######9  | 88/111 [01:00<00:15,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9417, LAS: 0.8942, UEM: 0.5688, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0678, partial_loss/deprel_loss: 0.7556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9934, loss: 0.7736, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  83%|########2 | 92/111 [01:02<00:12,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9423, LAS: 0.8947, UEM: 0.5730, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3825, partial_loss/deprel_loss: 0.4802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6360, loss: 0.7677, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  86%|########5 | 95/111 [01:05<00:11,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8799, UAS: 0.9423, LAS: 0.8947, UEM: 0.5699, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6675, partial_loss/deprel_loss: 0.6876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8590, loss: 0.7672, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  88%|########8 | 98/111 [01:07<00:09,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9425, LAS: 0.8949, UEM: 0.5694, LEM: 0.3394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4298, partial_loss/deprel_loss: 0.5523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7032, loss: 0.7656, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  91%|######### | 101/111 [01:09<00:07,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9427, LAS: 0.8950, UEM: 0.5679, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8124, partial_loss/deprel_loss: 0.7865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9671, loss: 0.7648, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  94%|#########3| 104/111 [01:12<00:05,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8479, UAS: 0.9427, LAS: 0.8950, UEM: 0.5721, LEM: 0.3398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1232, partial_loss/deprel_loss: 0.8301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0640, loss: 0.7638, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  96%|#########6| 107/111 [01:14<00:02,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9429, LAS: 0.8952, UEM: 0.5712, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4432, partial_loss/deprel_loss: 0.5331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6905, loss: 0.7619, batch_reg_loss: 0.1753, reg_loss: 0.1755 ||: 100%|##########| 111/111 [01:16<00:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9429, LAS: 0.8952, UEM: 0.5712, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4432, partial_loss/deprel_loss: 0.5331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6905, loss: 0.7619, batch_reg_loss: 0.1753, reg_loss: 0.1755 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.533  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.443  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.175  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - UEM                      |     0.571  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - LAS                      |     0.895  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - loss                     |     0.762  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - LEM                      |     0.339  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - UAS                      |     0.943  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - EM                       |     0.898  |       N/A\n",
+      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:20:03,753 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:20:08,702 - INFO - combo.training.trainer - Epoch duration: 0:01:24.945331\n",
+      "2023-04-07 00:20:08,702 - INFO - combo.training.trainer - Estimated training time remaining: 7:21:09\n",
+      "2023-04-07 00:20:08,702 - INFO - allennlp.training.trainer - Epoch 68/399\n",
+      "2023-04-07 00:20:08,703 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:20:08,703 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:20:08,712 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9535, LAS: 0.9120, UEM: 0.6017, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3017, partial_loss/deprel_loss: 0.4315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5809, loss: 0.6322, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:   4%|3         | 4/111 [00:02<01:05,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8080, UAS: 0.9387, LAS: 0.8935, UEM: 0.5898, LEM: 0.3554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9282, partial_loss/deprel_loss: 1.0957, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4375, loss: 0.7649, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:   7%|7         | 8/111 [00:05<01:05,  1.57it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9419, LAS: 0.8966, UEM: 0.6199, LEM: 0.3896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1184, partial_loss/deprel_loss: 0.2622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4087, loss: 0.7419, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  10%|9         | 11/111 [00:07<01:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9371, LAS: 0.8921, UEM: 0.6124, LEM: 0.3958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9503, partial_loss/deprel_loss: 0.7199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9412, loss: 0.7698, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  13%|#2        | 14/111 [00:09<01:07,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9398, LAS: 0.8943, UEM: 0.5887, LEM: 0.3609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6932, partial_loss/deprel_loss: 0.7136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8848, loss: 0.7637, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  16%|#6        | 18/111 [00:11<01:01,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9373, LAS: 0.8906, UEM: 0.5553, LEM: 0.3335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4083, partial_loss/deprel_loss: 0.5014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6580, loss: 0.7922, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  20%|#9        | 22/111 [00:14<00:57,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9363, LAS: 0.8891, UEM: 0.5288, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6937, partial_loss/deprel_loss: 0.7187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8890, loss: 0.8091, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  23%|##3       | 26/111 [00:16<00:52,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9373, LAS: 0.8901, UEM: 0.5235, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3720, partial_loss/deprel_loss: 0.4579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6160, loss: 0.7941, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  27%|##7       | 30/111 [00:19<00:50,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8641, UAS: 0.9370, LAS: 0.8900, UEM: 0.5187, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1057, partial_loss/deprel_loss: 0.7296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9801, loss: 0.7943, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  31%|###       | 34/111 [00:21<00:46,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9386, LAS: 0.8917, UEM: 0.5275, LEM: 0.3025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2765, partial_loss/deprel_loss: 0.3947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5464, loss: 0.7792, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  34%|###4      | 38/111 [00:24<00:45,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9375, LAS: 0.8906, UEM: 0.5236, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2414, partial_loss/deprel_loss: 0.3580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5099, loss: 0.7878, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  38%|###7      | 42/111 [00:26<00:44,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9376, LAS: 0.8906, UEM: 0.5201, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4612, partial_loss/deprel_loss: 0.5141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6788, loss: 0.7886, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  41%|####1     | 46/111 [00:30<00:44,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9371, LAS: 0.8898, UEM: 0.5100, LEM: 0.2858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8646, partial_loss/deprel_loss: 0.7190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9233, loss: 0.7953, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  45%|####5     | 50/111 [00:32<00:40,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9379, LAS: 0.8905, UEM: 0.5044, LEM: 0.2793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3146, partial_loss/deprel_loss: 0.5010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.7904, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  49%|####8     | 54/111 [00:35<00:37,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9390, LAS: 0.8916, UEM: 0.5100, LEM: 0.2795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7704, partial_loss/deprel_loss: 0.6965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8865, loss: 0.7837, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  52%|#####2    | 58/111 [00:37<00:34,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9404, LAS: 0.8931, UEM: 0.5284, LEM: 0.2965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2296, partial_loss/deprel_loss: 0.3919, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5346, loss: 0.7733, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  56%|#####5    | 62/111 [00:40<00:33,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9407, LAS: 0.8932, UEM: 0.5270, LEM: 0.2935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9076, partial_loss/deprel_loss: 0.7910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9895, loss: 0.7728, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  59%|#####8    | 65/111 [00:42<00:31,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9411, LAS: 0.8936, UEM: 0.5325, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7607, partial_loss/deprel_loss: 0.6914, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8805, loss: 0.7690, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  61%|######1   | 68/111 [00:45<00:31,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9413, LAS: 0.8941, UEM: 0.5542, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8555, partial_loss/deprel_loss: 0.7473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9442, loss: 0.7660, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  64%|######3   | 71/111 [00:47<00:30,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9424, LAS: 0.8953, UEM: 0.5672, LEM: 0.3410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2020, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5146, loss: 0.7573, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  67%|######6   | 74/111 [00:49<00:27,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9429, LAS: 0.8959, UEM: 0.5668, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3585, partial_loss/deprel_loss: 0.4436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6018, loss: 0.7541, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  69%|######9   | 77/111 [00:52<00:25,  1.33it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9430, LAS: 0.8959, UEM: 0.5699, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3904, partial_loss/deprel_loss: 0.5182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6678, loss: 0.7540, batch_reg_loss: 0.1752, reg_loss: 0.1752 ||:  72%|#######2  | 80/111 [00:54<00:23,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9431, LAS: 0.8959, UEM: 0.5689, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7975, partial_loss/deprel_loss: 0.6776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8768, loss: 0.7528, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  76%|#######5  | 84/111 [00:57<00:19,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9435, LAS: 0.8963, UEM: 0.5747, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4846, partial_loss/deprel_loss: 0.5977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7502, loss: 0.7493, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  78%|#######8  | 87/111 [00:59<00:17,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9434, LAS: 0.8962, UEM: 0.5679, LEM: 0.3372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4348, partial_loss/deprel_loss: 0.5119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6716, loss: 0.7515, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  82%|########1 | 91/111 [01:01<00:13,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9430, LAS: 0.8956, UEM: 0.5675, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3792, partial_loss/deprel_loss: 0.5264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6721, loss: 0.7560, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  86%|########5 | 95/111 [01:04<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9425, LAS: 0.8951, UEM: 0.5604, LEM: 0.3317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6581, partial_loss/deprel_loss: 0.6357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8153, loss: 0.7601, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  88%|########8 | 98/111 [01:06<00:09,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9430, LAS: 0.8956, UEM: 0.5657, LEM: 0.3356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2269, partial_loss/deprel_loss: 0.3150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4725, loss: 0.7555, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  91%|######### | 101/111 [01:09<00:07,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9434, LAS: 0.8958, UEM: 0.5635, LEM: 0.3316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3605, partial_loss/deprel_loss: 0.6125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7372, loss: 0.7544, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  94%|#########3| 104/111 [01:11<00:05,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9443, LAS: 0.8970, UEM: 0.5796, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1041, partial_loss/deprel_loss: 0.2231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3744, loss: 0.7458, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  97%|#########7| 108/111 [01:14<00:02,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9443, LAS: 0.8969, UEM: 0.5791, LEM: 0.3471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1234, partial_loss/deprel_loss: 0.8039, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0429, loss: 0.7461, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
+      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.804  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.123  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.175  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - UEM                      |     0.579  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - LAS                      |     0.897  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - loss                     |     0.746  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - LEM                      |     0.347  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - UAS                      |     0.944  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - EM                       |     0.867  |       N/A\n",
+      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:21:27,343 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:21:31,579 - INFO - combo.training.trainer - Epoch duration: 0:01:22.876591\n",
+      "2023-04-07 00:21:31,579 - INFO - combo.training.trainer - Estimated training time remaining: 7:20:04\n",
+      "2023-04-07 00:21:31,580 - INFO - allennlp.training.trainer - Epoch 69/399\n",
+      "2023-04-07 00:21:31,580 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:21:31,580 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:21:31,588 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9372, LAS: 0.8856, UEM: 0.3389, LEM: 0.1217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4732, partial_loss/deprel_loss: 0.4556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6342, loss: 0.8309, batch_reg_loss: 0.1751, reg_loss: 0.1751 ||:   4%|3         | 4/111 [00:02<01:07,  1.59it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9488, LAS: 0.9004, UEM: 0.5510, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2803, partial_loss/deprel_loss: 0.4075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5571, loss: 0.7200, batch_reg_loss: 0.1750, reg_loss: 0.1751 ||:   7%|7         | 8/111 [00:04<01:02,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9457, LAS: 0.8972, UEM: 0.5200, LEM: 0.2623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4084, partial_loss/deprel_loss: 0.4927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6509, loss: 0.7452, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  11%|#         | 12/111 [00:07<01:01,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8633, UAS: 0.9434, LAS: 0.8948, UEM: 0.5249, LEM: 0.2788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9379, partial_loss/deprel_loss: 0.8857, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0712, loss: 0.7653, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  14%|#3        | 15/111 [00:09<01:02,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9402, LAS: 0.8918, UEM: 0.5390, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2273, partial_loss/deprel_loss: 0.3256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4810, loss: 0.7944, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  16%|#6        | 18/111 [00:11<01:03,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9430, LAS: 0.8945, UEM: 0.5717, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3787, partial_loss/deprel_loss: 0.5596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6984, loss: 0.7723, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  19%|#8        | 21/111 [00:14<01:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9404, LAS: 0.8918, UEM: 0.5454, LEM: 0.3059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2247, partial_loss/deprel_loss: 0.8758, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1205, loss: 0.7921, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  22%|##1       | 24/111 [00:16<01:00,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8304, UAS: 0.9382, LAS: 0.8897, UEM: 0.5276, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6034, partial_loss/deprel_loss: 0.8647, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1875, loss: 0.8006, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  24%|##4       | 27/111 [00:18<00:58,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9380, LAS: 0.8899, UEM: 0.5353, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2211, partial_loss/deprel_loss: 0.3530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5016, loss: 0.8007, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  27%|##7       | 30/111 [00:20<00:59,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9380, LAS: 0.8903, UEM: 0.5375, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5019, loss: 0.7981, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  30%|##9       | 33/111 [00:22<00:57,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9395, LAS: 0.8919, UEM: 0.5439, LEM: 0.3135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5803, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 0.7799, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  33%|###3      | 37/111 [00:25<00:52,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9400, LAS: 0.8925, UEM: 0.5530, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3376, partial_loss/deprel_loss: 0.4714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6196, loss: 0.7748, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  37%|###6      | 41/111 [00:28<00:49,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9632, UAS: 0.9408, LAS: 0.8937, UEM: 0.5844, LEM: 0.3672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0568, partial_loss/deprel_loss: 0.1404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2986, loss: 0.7665, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  40%|###9      | 44/111 [00:30<00:49,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9411, LAS: 0.8936, UEM: 0.5783, LEM: 0.3588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2504, partial_loss/deprel_loss: 0.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6091, loss: 0.7676, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  42%|####2     | 47/111 [00:32<00:45,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8815, UAS: 0.9419, LAS: 0.8945, UEM: 0.5785, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6921, partial_loss/deprel_loss: 0.7226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8914, loss: 0.7608, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  46%|####5     | 51/111 [00:35<00:41,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9407, LAS: 0.8931, UEM: 0.5619, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9564, partial_loss/deprel_loss: 0.7671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9799, loss: 0.7714, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  50%|####9     | 55/111 [00:37<00:38,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9407, LAS: 0.8932, UEM: 0.5584, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5583, partial_loss/deprel_loss: 0.5483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7253, loss: 0.7697, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  53%|#####3    | 59/111 [00:40<00:34,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8819, UAS: 0.9405, LAS: 0.8928, UEM: 0.5496, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7194, partial_loss/deprel_loss: 0.7566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9240, loss: 0.7737, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  57%|#####6    | 63/111 [00:43<00:31,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9410, LAS: 0.8932, UEM: 0.5453, LEM: 0.3202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4204, partial_loss/deprel_loss: 0.5264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6801, loss: 0.7715, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  60%|######    | 67/111 [00:45<00:27,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9418, LAS: 0.8937, UEM: 0.5471, LEM: 0.3167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3232, partial_loss/deprel_loss: 0.4991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6388, loss: 0.7663, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  64%|######3   | 71/111 [00:48<00:26,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9413, LAS: 0.8930, UEM: 0.5375, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7553, partial_loss/deprel_loss: 0.7453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9222, loss: 0.7724, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  68%|######7   | 75/111 [00:51<00:24,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9418, LAS: 0.8934, UEM: 0.5385, LEM: 0.3074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5953, partial_loss/deprel_loss: 0.6810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8388, loss: 0.7695, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  70%|#######   | 78/111 [00:53<00:24,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9427, LAS: 0.8946, UEM: 0.5573, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2803, partial_loss/deprel_loss: 0.4075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5569, loss: 0.7609, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  73%|#######2  | 81/111 [00:55<00:21,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9429, LAS: 0.8948, UEM: 0.5602, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8755, partial_loss/deprel_loss: 0.6715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8872, loss: 0.7592, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  76%|#######5  | 84/111 [00:58<00:19,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9429, LAS: 0.8950, UEM: 0.5685, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2962, partial_loss/deprel_loss: 0.4650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6061, loss: 0.7592, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  78%|#######8  | 87/111 [01:00<00:17,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9437, LAS: 0.8959, UEM: 0.5770, LEM: 0.3451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2044, partial_loss/deprel_loss: 0.3830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5221, loss: 0.7520, batch_reg_loss: 0.1748, reg_loss: 0.1750 ||:  82%|########1 | 91/111 [01:02<00:14,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9440, LAS: 0.8962, UEM: 0.5740, LEM: 0.3409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4221, partial_loss/deprel_loss: 0.4896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6510, loss: 0.7511, batch_reg_loss: 0.1748, reg_loss: 0.1750 ||:  85%|########4 | 94/111 [01:05<00:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9435, LAS: 0.8957, UEM: 0.5720, LEM: 0.3396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3220, partial_loss/deprel_loss: 0.4080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5656, loss: 0.7546, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||:  88%|########8 | 98/111 [01:07<00:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9435, LAS: 0.8959, UEM: 0.5687, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9934, partial_loss/deprel_loss: 0.7374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9634, loss: 0.7537, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||:  92%|#########1| 102/111 [01:10<00:06,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9441, LAS: 0.8966, UEM: 0.5770, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1999, partial_loss/deprel_loss: 0.3860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.7478, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||:  95%|#########4| 105/111 [01:13<00:04,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9441, LAS: 0.8966, UEM: 0.5723, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3267, partial_loss/deprel_loss: 0.3953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5564, loss: 0.7484, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||:  98%|#########8| 109/111 [01:15<00:01,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9445, LAS: 0.8970, UEM: 0.5766, LEM: 0.3406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2103, partial_loss/deprel_loss: 0.3635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5076, loss: 0.7455, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||: 100%|##########| 111/111 [01:16<00:00,  1.44it/s]\n",
+      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.363  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.210  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.175  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - UEM                      |     0.577  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - LAS                      |     0.897  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - loss                     |     0.746  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - LEM                      |     0.341  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - UAS                      |     0.945  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - EM                       |     0.925  |       N/A\n",
+      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:22:51,434 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:22:55,983 - INFO - combo.training.trainer - Epoch duration: 0:01:24.403512\n",
+      "2023-04-07 00:22:55,983 - INFO - combo.training.trainer - Estimated training time remaining: 7:19:06\n",
+      "2023-04-07 00:22:55,984 - INFO - allennlp.training.trainer - Epoch 70/399\n",
+      "2023-04-07 00:22:55,984 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:22:55,984 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:22:55,993 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9506, LAS: 0.9042, UEM: 0.5290, LEM: 0.2968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6881, partial_loss/deprel_loss: 0.6097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8001, loss: 0.6847, batch_reg_loss: 0.1748, reg_loss: 0.1748 ||:   3%|2         | 3/111 [00:02<01:22,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9477, LAS: 0.8997, UEM: 0.5508, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2564, partial_loss/deprel_loss: 0.4398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5779, loss: 0.7136, batch_reg_loss: 0.1748, reg_loss: 0.1748 ||:   6%|6         | 7/111 [00:04<01:14,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9454, LAS: 0.8973, UEM: 0.5153, LEM: 0.2580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8429, partial_loss/deprel_loss: 0.8392, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0147, loss: 0.7399, batch_reg_loss: 0.1747, reg_loss: 0.1748 ||:  10%|9         | 11/111 [00:07<01:10,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9452, LAS: 0.8978, UEM: 0.5334, LEM: 0.2912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5317, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7221, loss: 0.7331, batch_reg_loss: 0.1747, reg_loss: 0.1748 ||:  13%|#2        | 14/111 [00:09<01:08,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9460, LAS: 0.8982, UEM: 0.5915, LEM: 0.3525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1596, partial_loss/deprel_loss: 0.8480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0851, loss: 0.7203, batch_reg_loss: 0.1747, reg_loss: 0.1748 ||:  16%|#6        | 18/111 [00:12<01:03,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9457, LAS: 0.8980, UEM: 0.5696, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4944, partial_loss/deprel_loss: 0.6857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8221, loss: 0.7229, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  20%|#9        | 22/111 [00:14<00:58,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9450, LAS: 0.8981, UEM: 0.5822, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1255, partial_loss/deprel_loss: 0.2653, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4120, loss: 0.7276, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  23%|##3       | 26/111 [00:17<00:55,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9464, LAS: 0.8994, UEM: 0.6001, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1067, partial_loss/deprel_loss: 0.3424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4700, loss: 0.7160, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  27%|##7       | 30/111 [00:19<00:52,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9470, LAS: 0.9001, UEM: 0.6030, LEM: 0.3675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7936, partial_loss/deprel_loss: 0.7543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9368, loss: 0.7124, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  30%|##9       | 33/111 [00:21<00:51,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9472, LAS: 0.9003, UEM: 0.6065, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4683, partial_loss/deprel_loss: 0.5891, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7396, loss: 0.7110, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  32%|###2      | 36/111 [00:24<00:52,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9483, LAS: 0.9017, UEM: 0.6156, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1905, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.7037, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  35%|###5      | 39/111 [00:26<00:50,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9464, LAS: 0.8989, UEM: 0.5964, LEM: 0.3577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5875, partial_loss/deprel_loss: 0.6289, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7953, loss: 0.7232, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  39%|###8      | 43/111 [00:28<00:46,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9463, LAS: 0.8987, UEM: 0.5899, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8414, partial_loss/deprel_loss: 0.6776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8850, loss: 0.7244, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  41%|####1     | 46/111 [00:31<00:46,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9472, LAS: 0.8996, UEM: 0.5881, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3002, partial_loss/deprel_loss: 0.4886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6255, loss: 0.7186, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  45%|####5     | 50/111 [00:33<00:41,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9467, LAS: 0.8991, UEM: 0.5861, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2186, partial_loss/deprel_loss: 0.3734, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5171, loss: 0.7234, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  49%|####8     | 54/111 [00:36<00:39,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9450, LAS: 0.8975, UEM: 0.5755, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5630, partial_loss/deprel_loss: 0.6081, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7737, loss: 0.7364, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  51%|#####1    | 57/111 [00:38<00:37,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9450, LAS: 0.8976, UEM: 0.5710, LEM: 0.3301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2503, partial_loss/deprel_loss: 0.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.7372, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  55%|#####4    | 61/111 [00:41<00:34,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9442, LAS: 0.8967, UEM: 0.5627, LEM: 0.3232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9444, partial_loss/deprel_loss: 0.8030, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0059, loss: 0.7428, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  59%|#####8    | 65/111 [00:43<00:30,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9451, LAS: 0.8978, UEM: 0.5759, LEM: 0.3349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3515, partial_loss/deprel_loss: 0.4999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6448, loss: 0.7330, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  62%|######2   | 69/111 [00:46<00:28,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9447, LAS: 0.8976, UEM: 0.5749, LEM: 0.3324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3702, partial_loss/deprel_loss: 0.4574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6146, loss: 0.7347, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  66%|######5   | 73/111 [00:49<00:26,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8852, UAS: 0.9453, LAS: 0.8984, UEM: 0.5932, LEM: 0.3584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6705, partial_loss/deprel_loss: 0.6253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8089, loss: 0.7296, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  68%|######8   | 76/111 [00:52<00:26,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9456, LAS: 0.8986, UEM: 0.5912, LEM: 0.3558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3765, partial_loss/deprel_loss: 0.5242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6692, loss: 0.7272, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  71%|#######1  | 79/111 [00:54<00:23,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9456, LAS: 0.8988, UEM: 0.5885, LEM: 0.3543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3512, partial_loss/deprel_loss: 0.3822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5506, loss: 0.7257, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  74%|#######3  | 82/111 [00:56<00:21,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9458, LAS: 0.8988, UEM: 0.5861, LEM: 0.3519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4328, partial_loss/deprel_loss: 0.5251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6812, loss: 0.7256, batch_reg_loss: 0.1745, reg_loss: 0.1747 ||:  77%|#######6  | 85/111 [00:58<00:18,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9459, LAS: 0.8990, UEM: 0.5836, LEM: 0.3492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6683, partial_loss/deprel_loss: 0.6249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8081, loss: 0.7242, batch_reg_loss: 0.1745, reg_loss: 0.1747 ||:  79%|#######9  | 88/111 [01:00<00:16,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9462, LAS: 0.8994, UEM: 0.5841, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3782, partial_loss/deprel_loss: 0.5520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6918, loss: 0.7221, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||:  83%|########2 | 92/111 [01:03<00:13,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9457, LAS: 0.8989, UEM: 0.5914, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1358, partial_loss/deprel_loss: 0.2361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3906, loss: 0.7262, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||:  86%|########5 | 95/111 [01:05<00:11,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9459, LAS: 0.8990, UEM: 0.5926, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2622, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5503, loss: 0.7256, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||:  89%|########9 | 99/111 [01:08<00:08,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9452, LAS: 0.8983, UEM: 0.5850, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6349, partial_loss/deprel_loss: 0.5700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 0.7305, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||:  93%|#########2| 103/111 [01:10<00:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9447, LAS: 0.8977, UEM: 0.5808, LEM: 0.3479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8001, partial_loss/deprel_loss: 0.7797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9583, loss: 0.7356, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||:  96%|#########6| 107/111 [01:12<00:02,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9445, LAS: 0.8976, UEM: 0.5775, LEM: 0.3453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5486, partial_loss/deprel_loss: 0.6677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8184, loss: 0.7377, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||: 100%|##########| 111/111 [01:15<00:00,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9445, LAS: 0.8976, UEM: 0.5775, LEM: 0.3453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5486, partial_loss/deprel_loss: 0.6677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8184, loss: 0.7377, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-07 00:24:14,896 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9488, LAS: 0.8951, UEM: 0.5461, LEM: 0.2057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4334, partial_loss/deprel_loss: 24.7874, partial_loss/cycle_loss: 0.0000, batch_loss: 19.9166, loss: 23.9872, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9478, LAS: 0.8936, UEM: 0.5263, LEM: 0.1940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5667, partial_loss/deprel_loss: 24.3909, partial_loss/cycle_loss: 0.0000, batch_loss: 19.6260, loss: 25.3352, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:07,  1.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8277, UAS: 0.9436, LAS: 0.8916, UEM: 0.6500, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5601, partial_loss/deprel_loss: 57.8863, partial_loss/cycle_loss: 0.0000, batch_loss: 46.6211, loss: 27.1227, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:06<00:05,  1.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9474, LAS: 0.8963, UEM: 0.6602, LEM: 0.3935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3731, partial_loss/deprel_loss: 17.6734, partial_loss/cycle_loss: 0.0000, batch_loss: 14.2133, loss: 25.4952, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:09<00:02,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9467, LAS: 0.8959, UEM: 0.6521, LEM: 0.3874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9122, partial_loss/deprel_loss: 31.0175, partial_loss/cycle_loss: 0.0000, batch_loss: 24.9964, loss: 26.0198, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9467, LAS: 0.8959, UEM: 0.6521, LEM: 0.3874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9122, partial_loss/deprel_loss: 31.0175, partial_loss/cycle_loss: 0.0000, batch_loss: 24.9964, loss: 26.0198, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
+      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.668  |    31.017\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.549  |     0.912\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.175  |     0.000\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - UEM                      |     0.577  |     0.652\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - LAS                      |     0.898  |     0.896\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - loss                     |     0.738  |    26.020\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - LEM                      |     0.345  |     0.387\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - UAS                      |     0.944  |     0.947\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - EM                       |     0.896  |     0.884\n",
+      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:24:27,558 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:24:32,516 - INFO - combo.training.trainer - Epoch duration: 0:01:36.532109\n",
+      "2023-04-07 00:24:32,516 - INFO - combo.training.trainer - Estimated training time remaining: 7:19:04\n",
+      "2023-04-07 00:24:32,516 - INFO - allennlp.training.trainer - Epoch 71/399\n",
+      "2023-04-07 00:24:32,516 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:24:32,517 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:24:32,524 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9590, LAS: 0.9141, UEM: 0.6957, LEM: 0.4722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1020, partial_loss/deprel_loss: 0.2615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4041, loss: 0.6331, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:   4%|3         | 4/111 [00:02<01:12,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8606, UAS: 0.9402, LAS: 0.8957, UEM: 0.6073, LEM: 0.4034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0627, partial_loss/deprel_loss: 0.6654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9193, loss: 0.7472, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:   6%|6         | 7/111 [00:05<01:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9451, LAS: 0.9012, UEM: 0.5755, LEM: 0.3458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3404, partial_loss/deprel_loss: 0.4493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6020, loss: 0.7071, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  10%|9         | 11/111 [00:07<01:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9442, LAS: 0.8999, UEM: 0.5837, LEM: 0.3646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6201, partial_loss/deprel_loss: 0.6013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7796, loss: 0.7150, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  14%|#3        | 15/111 [00:10<01:04,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9411, LAS: 0.8963, UEM: 0.5649, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4521, partial_loss/deprel_loss: 0.5205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6813, loss: 0.7479, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  16%|#6        | 18/111 [00:12<01:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9401, LAS: 0.8946, UEM: 0.5597, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2594, partial_loss/deprel_loss: 0.4458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5830, loss: 0.7609, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  20%|#9        | 22/111 [00:15<01:01,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9231, UAS: 0.9421, LAS: 0.8969, UEM: 0.5898, LEM: 0.3564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2663, partial_loss/deprel_loss: 0.4187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5626, loss: 0.7449, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  23%|##2       | 25/111 [00:17<01:00,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8760, UAS: 0.9435, LAS: 0.8984, UEM: 0.5941, LEM: 0.3574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9035, partial_loss/deprel_loss: 0.7504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9555, loss: 0.7326, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  26%|##6       | 29/111 [00:19<00:56,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9435, LAS: 0.8980, UEM: 0.5835, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2197, partial_loss/deprel_loss: 0.3918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5318, loss: 0.7323, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  30%|##9       | 33/111 [00:22<00:51,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8720, UAS: 0.9419, LAS: 0.8962, UEM: 0.5642, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8650, partial_loss/deprel_loss: 0.7420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9410, loss: 0.7496, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  32%|###2      | 36/111 [00:24<00:50,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9417, LAS: 0.8960, UEM: 0.5526, LEM: 0.3200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4917, partial_loss/deprel_loss: 0.5471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7104, loss: 0.7502, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  35%|###5      | 39/111 [00:26<00:49,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9422, LAS: 0.8962, UEM: 0.5459, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3982, partial_loss/deprel_loss: 0.4688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6291, loss: 0.7475, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  39%|###8      | 43/111 [00:28<00:45,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9426, LAS: 0.8967, UEM: 0.5581, LEM: 0.3228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2111, partial_loss/deprel_loss: 0.3592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5040, loss: 0.7444, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  42%|####2     | 47/111 [00:32<00:45,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9429, LAS: 0.8970, UEM: 0.5574, LEM: 0.3219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6908, partial_loss/deprel_loss: 0.6305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8170, loss: 0.7423, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  45%|####5     | 50/111 [00:34<00:44,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9442, LAS: 0.8986, UEM: 0.5893, LEM: 0.3646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2660, partial_loss/deprel_loss: 0.4181, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5620, loss: 0.7319, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  48%|####7     | 53/111 [00:37<00:44,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8396, UAS: 0.9442, LAS: 0.8985, UEM: 0.5971, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2169, partial_loss/deprel_loss: 0.9480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1761, loss: 0.7328, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  51%|#####1    | 57/111 [00:39<00:39,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9446, LAS: 0.8990, UEM: 0.5982, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2724, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5367, loss: 0.7271, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  54%|#####4    | 60/111 [00:41<00:36,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9439, LAS: 0.8982, UEM: 0.5894, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8146, partial_loss/deprel_loss: 0.7395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9289, loss: 0.7332, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  58%|#####7    | 64/111 [00:44<00:32,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9441, LAS: 0.8983, UEM: 0.5906, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2832, partial_loss/deprel_loss: 0.4338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5781, loss: 0.7327, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  60%|######    | 67/111 [00:46<00:30,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9442, LAS: 0.8982, UEM: 0.5844, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, partial_loss/deprel_loss: 0.5362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6735, loss: 0.7346, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  64%|######3   | 71/111 [00:48<00:26,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9443, LAS: 0.8983, UEM: 0.5809, LEM: 0.3504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4050, partial_loss/deprel_loss: 0.4906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6479, loss: 0.7343, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  68%|######7   | 75/111 [00:51<00:23,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9447, LAS: 0.8986, UEM: 0.5798, LEM: 0.3479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2284, partial_loss/deprel_loss: 0.3343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4875, loss: 0.7322, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9449, LAS: 0.8989, UEM: 0.5804, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3447, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4958, loss: 0.7293, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9453, LAS: 0.8992, UEM: 0.5786, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2871, partial_loss/deprel_loss: 0.4169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5653, loss: 0.7271, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  77%|#######7  | 86/111 [00:59<00:17,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8387, UAS: 0.9448, LAS: 0.8986, UEM: 0.5749, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3576, partial_loss/deprel_loss: 0.9162, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1788, loss: 0.7315, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  80%|########  | 89/111 [01:01<00:15,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9453, LAS: 0.8991, UEM: 0.5820, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2507, partial_loss/deprel_loss: 0.3985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5433, loss: 0.7274, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  84%|########3 | 93/111 [01:04<00:12,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9457, LAS: 0.8996, UEM: 0.5859, LEM: 0.3502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2463, partial_loss/deprel_loss: 0.3536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.7239, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  86%|########6 | 96/111 [01:06<00:10,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9452, LAS: 0.8989, UEM: 0.5788, LEM: 0.3453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8455, partial_loss/deprel_loss: 0.7369, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9329, loss: 0.7287, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  89%|########9 | 99/111 [01:08<00:08,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9451, LAS: 0.8987, UEM: 0.5735, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4627, partial_loss/deprel_loss: 0.5341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6941, loss: 0.7290, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  93%|#########2| 103/111 [01:10<00:05,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9452, LAS: 0.8988, UEM: 0.5804, LEM: 0.3492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5536, partial_loss/deprel_loss: 0.6417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7984, loss: 0.7292, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  95%|#########5| 106/111 [01:13<00:03,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9449, LAS: 0.8985, UEM: 0.5797, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2004, partial_loss/deprel_loss: 0.3910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5271, loss: 0.7315, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  98%|#########8| 109/111 [01:15<00:01,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9453, LAS: 0.8989, UEM: 0.5821, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2464, partial_loss/deprel_loss: 0.4372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5733, loss: 0.7289, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
+      "2023-04-07 00:25:51,826 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.437  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.246  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.174  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - UEM                      |     0.582  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - LAS                      |     0.899  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - loss                     |     0.729  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - LEM                      |     0.350  |       N/A\n",
+      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - UAS                      |     0.945  |       N/A\n",
+      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - EM                       |     0.919  |       N/A\n",
+      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:25:51,833 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:25:58,450 - INFO - combo.training.trainer - Epoch duration: 0:01:25.934082\n",
+      "2023-04-07 00:25:58,451 - INFO - combo.training.trainer - Estimated training time remaining: 7:18:10\n",
+      "2023-04-07 00:25:58,451 - INFO - allennlp.training.trainer - Epoch 72/399\n",
+      "2023-04-07 00:25:58,451 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:25:58,451 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:25:58,459 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.9210, LAS: 0.8741, UEM: 0.1528, LEM: 0.0349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0325, partial_loss/deprel_loss: 0.7074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9467, loss: 0.9111, batch_reg_loss: 0.1743, reg_loss: 0.1743 ||:   3%|2         | 3/111 [00:02<01:14,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9339, LAS: 0.8884, UEM: 0.3328, LEM: 0.1396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3098, partial_loss/deprel_loss: 0.4203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5725, loss: 0.8094, batch_reg_loss: 0.1743, reg_loss: 0.1743 ||:   5%|5         | 6/111 [00:04<01:12,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9389, LAS: 0.8942, UEM: 0.3980, LEM: 0.1852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2779, partial_loss/deprel_loss: 0.4066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5551, loss: 0.7716, batch_reg_loss: 0.1742, reg_loss: 0.1743 ||:   8%|8         | 9/111 [00:06<01:12,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9455, LAS: 0.9005, UEM: 0.5356, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2017, partial_loss/deprel_loss: 0.3285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4774, loss: 0.7129, batch_reg_loss: 0.1742, reg_loss: 0.1743 ||:  11%|#         | 12/111 [00:08<01:10,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9476, LAS: 0.9035, UEM: 0.6410, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0145, partial_loss/deprel_loss: 0.7799, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0010, loss: 0.6982, batch_reg_loss: 0.1742, reg_loss: 0.1743 ||:  14%|#3        | 15/111 [00:11<01:14,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9487, LAS: 0.9049, UEM: 0.6574, LEM: 0.4550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1425, partial_loss/deprel_loss: 0.2706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4192, loss: 0.6935, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  16%|#6        | 18/111 [00:13<01:09,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8470, UAS: 0.9461, LAS: 0.9020, UEM: 0.6318, LEM: 0.4214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3470, partial_loss/deprel_loss: 0.7804, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0679, loss: 0.7139, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  20%|#9        | 22/111 [00:16<01:04,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9479, LAS: 0.9035, UEM: 0.6285, LEM: 0.4075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5938, partial_loss/deprel_loss: 0.5446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7286, loss: 0.6959, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  23%|##3       | 26/111 [00:18<00:59,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9480, LAS: 0.9035, UEM: 0.6255, LEM: 0.4011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2719, partial_loss/deprel_loss: 0.4565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5938, loss: 0.6938, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  26%|##6       | 29/111 [00:21<00:59,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9482, LAS: 0.9034, UEM: 0.6138, LEM: 0.3845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5769, partial_loss/deprel_loss: 0.6008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7702, loss: 0.6935, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  30%|##9       | 33/111 [00:23<00:55,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9489, LAS: 0.9044, UEM: 0.6279, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6194, partial_loss/deprel_loss: 0.5291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7213, loss: 0.6839, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  32%|###2      | 36/111 [00:26<00:55,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9488, LAS: 0.9043, UEM: 0.6230, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4926, loss: 0.6844, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  36%|###6      | 40/111 [00:29<00:52,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9484, LAS: 0.9035, UEM: 0.6086, LEM: 0.3789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5742, partial_loss/deprel_loss: 0.5775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7509, loss: 0.6907, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  40%|###9      | 44/111 [00:31<00:46,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9482, LAS: 0.9033, UEM: 0.5955, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, partial_loss/deprel_loss: 0.4102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5725, loss: 0.6924, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  43%|####3     | 48/111 [00:33<00:41,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8468, UAS: 0.9474, LAS: 0.9021, UEM: 0.5940, LEM: 0.3668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2345, partial_loss/deprel_loss: 0.8553, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1053, loss: 0.7012, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  47%|####6     | 52/111 [00:36<00:38,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9483, LAS: 0.9031, UEM: 0.6069, LEM: 0.3767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2363, partial_loss/deprel_loss: 0.3497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5011, loss: 0.6941, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  50%|#####     | 56/111 [00:39<00:36,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9483, LAS: 0.9028, UEM: 0.5992, LEM: 0.3684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2925, partial_loss/deprel_loss: 0.3917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5459, loss: 0.6959, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  54%|#####4    | 60/111 [00:41<00:33,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9464, LAS: 0.9008, UEM: 0.5965, LEM: 0.3693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0754, partial_loss/deprel_loss: 0.7823, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0150, loss: 0.7112, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  58%|#####7    | 64/111 [00:44<00:31,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8076, UAS: 0.9458, LAS: 0.9003, UEM: 0.6044, LEM: 0.3765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8518, partial_loss/deprel_loss: 1.1044, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4279, loss: 0.7156, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  61%|######1   | 68/111 [00:47<00:29,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9458, LAS: 0.9002, UEM: 0.6026, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6688, partial_loss/deprel_loss: 0.6208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8045, loss: 0.7183, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  64%|######3   | 71/111 [00:49<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9461, LAS: 0.9006, UEM: 0.6006, LEM: 0.3704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3879, partial_loss/deprel_loss: 0.5238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6707, loss: 0.7152, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  67%|######6   | 74/111 [00:52<00:26,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9453, LAS: 0.8996, UEM: 0.5901, LEM: 0.3609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5763, partial_loss/deprel_loss: 0.6045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7729, loss: 0.7218, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  70%|#######   | 78/111 [00:54<00:22,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9454, LAS: 0.8994, UEM: 0.5849, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7327, partial_loss/deprel_loss: 0.6924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8746, loss: 0.7226, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  74%|#######3  | 82/111 [00:56<00:19,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9455, LAS: 0.8995, UEM: 0.5842, LEM: 0.3510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7146, partial_loss/deprel_loss: 0.6244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8165, loss: 0.7207, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  77%|#######7  | 86/111 [00:59<00:16,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8576, UAS: 0.9446, LAS: 0.8984, UEM: 0.5772, LEM: 0.3451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0883, partial_loss/deprel_loss: 0.7811, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0166, loss: 0.7292, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  81%|########1 | 90/111 [01:02<00:13,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9444, LAS: 0.8984, UEM: 0.5738, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8949, partial_loss/deprel_loss: 0.6739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8922, loss: 0.7309, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  85%|########4 | 94/111 [01:04<00:11,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9445, LAS: 0.8985, UEM: 0.5741, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7387, partial_loss/deprel_loss: 0.6574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8477, loss: 0.7307, batch_reg_loss: 0.1741, reg_loss: 0.1741 ||:  88%|########8 | 98/111 [01:07<00:08,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9456, LAS: 0.8997, UEM: 0.5927, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0877, partial_loss/deprel_loss: 0.2313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3766, loss: 0.7215, batch_reg_loss: 0.1741, reg_loss: 0.1741 ||:  92%|#########1| 102/111 [01:10<00:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9453, LAS: 0.8995, UEM: 0.5870, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6028, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7565, loss: 0.7237, batch_reg_loss: 0.1741, reg_loss: 0.1741 ||:  95%|#########4| 105/111 [01:12<00:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9456, LAS: 0.8997, UEM: 0.5861, LEM: 0.3529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4799, partial_loss/deprel_loss: 0.5671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7237, loss: 0.7223, batch_reg_loss: 0.1741, reg_loss: 0.1741 ||:  97%|#########7| 108/111 [01:14<00:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9457, LAS: 0.8998, UEM: 0.5843, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.4537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5946, loss: 0.7223, batch_reg_loss: 0.1740, reg_loss: 0.1741 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9457, LAS: 0.8998, UEM: 0.5843, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.4537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5946, loss: 0.7223, batch_reg_loss: 0.1740, reg_loss: 0.1741 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-07 00:27:18,544 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.454  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.288  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.174  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - UEM                      |     0.584  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - LAS                      |     0.900  |       N/A\n",
+      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - loss                     |     0.722  |       N/A\n",
+      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - LEM                      |     0.351  |       N/A\n",
+      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - UAS                      |     0.946  |       N/A\n",
+      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - EM                       |     0.924  |       N/A\n",
+      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:27:18,552 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:27:24,771 - INFO - combo.training.trainer - Epoch duration: 0:01:26.320285\n",
+      "2023-04-07 00:27:24,771 - INFO - combo.training.trainer - Estimated training time remaining: 7:17:18\n",
+      "2023-04-07 00:27:24,771 - INFO - allennlp.training.trainer - Epoch 73/399\n",
+      "2023-04-07 00:27:24,772 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:27:24,772 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:27:24,779 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9532, LAS: 0.9077, UEM: 0.5342, LEM: 0.2404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2385, partial_loss/deprel_loss: 0.4693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5971, loss: 0.6751, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:   4%|3         | 4/111 [00:02<01:12,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9652, UAS: 0.9604, LAS: 0.9180, UEM: 0.7379, LEM: 0.5320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0522, partial_loss/deprel_loss: 0.1375, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2945, loss: 0.5981, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:   6%|6         | 7/111 [00:05<01:14,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9585, LAS: 0.9155, UEM: 0.6843, LEM: 0.4623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3479, partial_loss/deprel_loss: 0.5002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6437, loss: 0.6111, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:  10%|9         | 11/111 [00:07<01:10,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9587, LAS: 0.9153, UEM: 0.6754, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6654, partial_loss/deprel_loss: 0.5753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7673, loss: 0.6098, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:  13%|#2        | 14/111 [00:10<01:09,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9597, LAS: 0.9163, UEM: 0.6823, LEM: 0.4418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2609, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5908, loss: 0.6001, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:  15%|#5        | 17/111 [00:12<01:09,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9560, LAS: 0.9106, UEM: 0.6453, LEM: 0.4084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8720, partial_loss/deprel_loss: 0.6651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8805, loss: 0.6418, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:  19%|#8        | 21/111 [00:15<01:04,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8644, UAS: 0.9553, LAS: 0.9103, UEM: 0.6530, LEM: 0.4157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0246, partial_loss/deprel_loss: 0.8085, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0257, loss: 0.6453, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:  22%|##1       | 24/111 [00:17<01:02,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9540, LAS: 0.9098, UEM: 0.6519, LEM: 0.4187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3734, partial_loss/deprel_loss: 0.4383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5992, loss: 0.6471, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  24%|##4       | 27/111 [00:19<01:00,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8607, UAS: 0.9525, LAS: 0.9076, UEM: 0.6388, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9665, partial_loss/deprel_loss: 0.7185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9421, loss: 0.6611, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  28%|##7       | 31/111 [00:21<00:55,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9514, LAS: 0.9063, UEM: 0.6255, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0289, partial_loss/deprel_loss: 0.7669, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9932, loss: 0.6731, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  31%|###       | 34/111 [00:24<00:52,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9517, LAS: 0.9066, UEM: 0.6244, LEM: 0.3906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1890, partial_loss/deprel_loss: 0.3509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4924, loss: 0.6727, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  33%|###3      | 37/111 [00:26<00:51,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9514, LAS: 0.9063, UEM: 0.6176, LEM: 0.3814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5196, partial_loss/deprel_loss: 0.5613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7269, loss: 0.6731, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  36%|###6      | 40/111 [00:28<00:49,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9502, LAS: 0.9048, UEM: 0.6083, LEM: 0.3723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0434, partial_loss/deprel_loss: 0.8135, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0334, loss: 0.6860, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  40%|###9      | 44/111 [00:30<00:45,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9485, LAS: 0.9032, UEM: 0.5897, LEM: 0.3579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9389, partial_loss/deprel_loss: 0.7671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9754, loss: 0.7012, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  43%|####3     | 48/111 [00:33<00:41,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9485, LAS: 0.9034, UEM: 0.5817, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7179, partial_loss/deprel_loss: 0.6370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8271, loss: 0.7025, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  47%|####6     | 52/111 [00:35<00:37,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9486, LAS: 0.9035, UEM: 0.5822, LEM: 0.3508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3235, partial_loss/deprel_loss: 0.4352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5868, loss: 0.7005, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  50%|#####     | 56/111 [00:38<00:37,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9498, LAS: 0.9046, UEM: 0.6007, LEM: 0.3648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2713, partial_loss/deprel_loss: 0.4238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5672, loss: 0.6910, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  53%|#####3    | 59/111 [00:40<00:36,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9496, LAS: 0.9047, UEM: 0.6015, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4178, partial_loss/deprel_loss: 0.4418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6108, loss: 0.6893, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  56%|#####5    | 62/111 [00:43<00:34,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9491, LAS: 0.9041, UEM: 0.5914, LEM: 0.3569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4079, partial_loss/deprel_loss: 0.4585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6222, loss: 0.6939, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:  59%|#####9    | 66/111 [00:45<00:30,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9480, LAS: 0.9030, UEM: 0.5828, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3412, partial_loss/deprel_loss: 0.4105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5705, loss: 0.7012, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:  63%|######3   | 70/111 [00:48<00:27,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9473, LAS: 0.9025, UEM: 0.5904, LEM: 0.3606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8044, partial_loss/deprel_loss: 1.0041, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3380, loss: 0.7049, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:  67%|######6   | 74/111 [00:51<00:26,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9003, UAS: 0.9475, LAS: 0.9027, UEM: 0.5984, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5672, partial_loss/deprel_loss: 0.6062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7722, loss: 0.7044, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:  69%|######9   | 77/111 [00:53<00:23,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9465, LAS: 0.9015, UEM: 0.5902, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6163, partial_loss/deprel_loss: 0.5954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7734, loss: 0.7126, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:  72%|#######2  | 80/111 [00:55<00:22,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9460, LAS: 0.9007, UEM: 0.5845, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9029, partial_loss/deprel_loss: 0.7944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9899, loss: 0.7188, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  76%|#######5  | 84/111 [00:58<00:18,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8562, UAS: 0.9461, LAS: 0.9008, UEM: 0.5894, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0194, partial_loss/deprel_loss: 0.7513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9788, loss: 0.7168, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  79%|#######9  | 88/111 [01:00<00:15,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9464, LAS: 0.9011, UEM: 0.5857, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3949, partial_loss/deprel_loss: 0.4863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6419, loss: 0.7150, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  82%|########1 | 91/111 [01:03<00:14,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9463, LAS: 0.9008, UEM: 0.5802, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7188, partial_loss/deprel_loss: 0.7382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9082, loss: 0.7179, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  85%|########4 | 94/111 [01:05<00:12,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9464, LAS: 0.9009, UEM: 0.5844, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3451, partial_loss/deprel_loss: 0.4686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6178, loss: 0.7152, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  87%|########7 | 97/111 [01:07<00:10,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9463, LAS: 0.9008, UEM: 0.5848, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3774, partial_loss/deprel_loss: 0.5079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6556, loss: 0.7175, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  90%|######### | 100/111 [01:09<00:08,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9466, LAS: 0.9012, UEM: 0.5866, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2466, partial_loss/deprel_loss: 0.4409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5759, loss: 0.7140, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  94%|#########3| 104/111 [01:12<00:05,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8519, UAS: 0.9466, LAS: 0.9010, UEM: 0.5883, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2192, partial_loss/deprel_loss: 0.8357, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0862, loss: 0.7151, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  96%|#########6| 107/111 [01:14<00:02,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9465, LAS: 0.9009, UEM: 0.5843, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5333, partial_loss/deprel_loss: 0.6096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7682, loss: 0.7148, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 100%|##########| 111/111 [01:17<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9465, LAS: 0.9009, UEM: 0.5843, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5333, partial_loss/deprel_loss: 0.6096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7682, loss: 0.7148, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 100%|##########| 111/111 [01:17<00:00,  1.44it/s]\n",
+      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.610  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.533  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.174  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - UEM                      |     0.584  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - LAS                      |     0.901  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - loss                     |     0.715  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - LEM                      |     0.354  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - UAS                      |     0.947  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - EM                       |     0.894  |       N/A\n",
+      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:28:45,380 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:28:50,593 - INFO - combo.training.trainer - Epoch duration: 0:01:25.821825\n",
+      "2023-04-07 00:28:50,594 - INFO - combo.training.trainer - Estimated training time remaining: 7:16:22\n",
+      "2023-04-07 00:28:50,594 - INFO - allennlp.training.trainer - Epoch 74/399\n",
+      "2023-04-07 00:28:50,594 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:28:50,595 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:28:50,602 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8910, UAS: 0.9457, LAS: 0.8979, UEM: 0.4358, LEM: 0.1813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4698, partial_loss/deprel_loss: 0.6442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7831, loss: 0.7372, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:   4%|3         | 4/111 [00:02<01:04,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9483, LAS: 0.8997, UEM: 0.4974, LEM: 0.2300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4275, partial_loss/deprel_loss: 0.6147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7511, loss: 0.7173, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:   6%|6         | 7/111 [00:04<01:06,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9457, LAS: 0.8984, UEM: 0.4551, LEM: 0.2003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5032, partial_loss/deprel_loss: 0.5335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7012, loss: 0.7334, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:  10%|9         | 11/111 [00:07<01:03,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9439, LAS: 0.8984, UEM: 0.4737, LEM: 0.2324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5044, loss: 0.7341, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:  13%|#2        | 14/111 [00:09<01:03,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9475, LAS: 0.9026, UEM: 0.5509, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4653, partial_loss/deprel_loss: 0.5485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7056, loss: 0.7058, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:  16%|#6        | 18/111 [00:11<01:01,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9479, LAS: 0.9031, UEM: 0.5658, LEM: 0.3382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1822, partial_loss/deprel_loss: 0.3363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4793, loss: 0.6988, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:  20%|#9        | 22/111 [00:14<01:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9479, LAS: 0.9028, UEM: 0.5521, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3213, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5888, loss: 0.7014, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:  23%|##2       | 25/111 [00:17<01:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9484, LAS: 0.9031, UEM: 0.5483, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3309, partial_loss/deprel_loss: 0.5004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.6986, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  25%|##5       | 28/111 [00:19<01:00,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9473, LAS: 0.9015, UEM: 0.5368, LEM: 0.3037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6838, partial_loss/deprel_loss: 0.6598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8384, loss: 0.7088, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  29%|##8       | 32/111 [00:21<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9485, LAS: 0.9027, UEM: 0.5627, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3361, partial_loss/deprel_loss: 0.4837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6279, loss: 0.7007, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  32%|###1      | 35/111 [00:24<00:53,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9499, LAS: 0.9039, UEM: 0.5790, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.4233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5580, loss: 0.6914, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  34%|###4      | 38/111 [00:26<00:53,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8834, UAS: 0.9492, LAS: 0.9031, UEM: 0.5832, LEM: 0.3421, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5601, partial_loss/deprel_loss: 0.7277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8679, loss: 0.6963, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  37%|###6      | 41/111 [00:28<00:50,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8833, UAS: 0.9482, LAS: 0.9020, UEM: 0.5690, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8162, partial_loss/deprel_loss: 0.7002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8971, loss: 0.7059, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  40%|###9      | 44/111 [00:30<00:48,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9478, LAS: 0.9018, UEM: 0.5640, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2325, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5083, loss: 0.7076, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  43%|####3     | 48/111 [00:33<00:42,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9472, LAS: 0.9016, UEM: 0.5642, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2649, partial_loss/deprel_loss: 0.3708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5233, loss: 0.7090, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  47%|####6     | 52/111 [00:35<00:40,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9473, LAS: 0.9019, UEM: 0.5663, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2980, partial_loss/deprel_loss: 0.4821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6190, loss: 0.7079, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  50%|####9     | 55/111 [00:37<00:38,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9480, LAS: 0.9025, UEM: 0.5654, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2673, partial_loss/deprel_loss: 0.4732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6057, loss: 0.7046, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  52%|#####2    | 58/111 [00:40<00:37,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9475, LAS: 0.9022, UEM: 0.5687, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5214, loss: 0.7055, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  56%|#####5    | 62/111 [00:42<00:34,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9476, LAS: 0.9025, UEM: 0.6012, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1395, partial_loss/deprel_loss: 0.3569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4871, loss: 0.7037, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  59%|#####8    | 65/111 [00:45<00:33,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9469, LAS: 0.9016, UEM: 0.5897, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5729, partial_loss/deprel_loss: 0.5866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 0.7124, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  62%|######2   | 69/111 [00:47<00:29,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8403, UAS: 0.9468, LAS: 0.9016, UEM: 0.5911, LEM: 0.3602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4491, partial_loss/deprel_loss: 0.8480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1418, loss: 0.7127, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  66%|######5   | 73/111 [00:50<00:26,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9465, LAS: 0.9013, UEM: 0.5840, LEM: 0.3541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7986, partial_loss/deprel_loss: 0.7437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9283, loss: 0.7160, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  68%|######8   | 76/111 [00:52<00:24,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9460, LAS: 0.9008, UEM: 0.5814, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2858, partial_loss/deprel_loss: 0.4362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.7194, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  72%|#######2  | 80/111 [00:55<00:20,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9465, LAS: 0.9011, UEM: 0.5803, LEM: 0.3452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4513, partial_loss/deprel_loss: 0.5489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7031, loss: 0.7158, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  76%|#######5  | 84/111 [00:57<00:18,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8191, UAS: 0.9453, LAS: 0.8998, UEM: 0.5735, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7406, partial_loss/deprel_loss: 1.0592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3691, loss: 0.7262, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  78%|#######8  | 87/111 [01:00<00:16,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9462, LAS: 0.9008, UEM: 0.5816, LEM: 0.3452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1876, partial_loss/deprel_loss: 0.3523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4930, loss: 0.7184, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  82%|########1 | 91/111 [01:02<00:13,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8601, UAS: 0.9458, LAS: 0.9004, UEM: 0.5796, LEM: 0.3441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9515, partial_loss/deprel_loss: 0.8350, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0319, loss: 0.7209, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  86%|########5 | 95/111 [01:05<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9462, LAS: 0.9009, UEM: 0.5865, LEM: 0.3511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2142, partial_loss/deprel_loss: 0.3441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4918, loss: 0.7158, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  88%|########8 | 98/111 [01:07<00:09,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9463, LAS: 0.9009, UEM: 0.5842, LEM: 0.3484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3423, partial_loss/deprel_loss: 0.5043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6456, loss: 0.7160, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  91%|######### | 101/111 [01:09<00:07,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9461, LAS: 0.9005, UEM: 0.5788, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9346, partial_loss/deprel_loss: 0.7656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9730, loss: 0.7180, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  95%|#########4| 105/111 [01:12<00:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9465, LAS: 0.9009, UEM: 0.5816, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6470, partial_loss/deprel_loss: 0.5651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7551, loss: 0.7137, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  98%|#########8| 109/111 [01:15<00:01,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9469, LAS: 0.9013, UEM: 0.5879, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4319, partial_loss/deprel_loss: 0.4654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6323, loss: 0.7106, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.465  |       N/A\n",
+      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.432  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.174  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - UEM                      |     0.588  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - LAS                      |     0.901  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - loss                     |     0.711  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - LEM                      |     0.351  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - UAS                      |     0.947  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - EM                       |     0.912  |       N/A\n",
+      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:30:10,477 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:30:15,615 - INFO - combo.training.trainer - Epoch duration: 0:01:25.020714\n",
+      "2023-04-07 00:30:15,615 - INFO - combo.training.trainer - Estimated training time remaining: 7:15:22\n",
+      "2023-04-07 00:30:15,616 - INFO - allennlp.training.trainer - Epoch 75/399\n",
+      "2023-04-07 00:30:15,616 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:30:15,616 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:30:15,626 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9491, LAS: 0.9042, UEM: 0.4891, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6299, partial_loss/deprel_loss: 0.6336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8064, loss: 0.7056, batch_reg_loss: 0.1736, reg_loss: 0.1736 ||:   4%|3         | 4/111 [00:02<01:08,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9499, LAS: 0.9071, UEM: 0.4945, LEM: 0.2844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3865, partial_loss/deprel_loss: 0.4271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.6799, batch_reg_loss: 0.1736, reg_loss: 0.1736 ||:   6%|6         | 7/111 [00:04<01:07,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9516, LAS: 0.9080, UEM: 0.5327, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4005, partial_loss/deprel_loss: 0.5567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6990, loss: 0.6671, batch_reg_loss: 0.1735, reg_loss: 0.1736 ||:   9%|9         | 10/111 [00:06<01:06,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9507, LAS: 0.9067, UEM: 0.5098, LEM: 0.2815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4433, partial_loss/deprel_loss: 0.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6896, loss: 0.6811, batch_reg_loss: 0.1735, reg_loss: 0.1736 ||:  12%|#1        | 13/111 [00:08<01:05,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9465, LAS: 0.9025, UEM: 0.4974, LEM: 0.2796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9581, partial_loss/deprel_loss: 0.7562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9701, loss: 0.7203, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  15%|#5        | 17/111 [00:11<01:02,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9489, LAS: 0.9046, UEM: 0.5301, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2274, partial_loss/deprel_loss: 0.4505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5794, loss: 0.6991, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  19%|#8        | 21/111 [00:14<01:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9478, LAS: 0.9035, UEM: 0.5397, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5845, partial_loss/deprel_loss: 0.5930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7648, loss: 0.7022, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  22%|##1       | 24/111 [00:16<00:58,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9468, LAS: 0.9015, UEM: 0.5314, LEM: 0.3007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2592, partial_loss/deprel_loss: 0.4407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5779, loss: 0.7139, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  24%|##4       | 27/111 [00:18<00:58,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9464, LAS: 0.9007, UEM: 0.5205, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8469, partial_loss/deprel_loss: 0.7144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9144, loss: 0.7212, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  28%|##7       | 31/111 [00:20<00:54,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9458, LAS: 0.9003, UEM: 0.5028, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7110, partial_loss/deprel_loss: 0.5689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7708, loss: 0.7229, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  32%|###1      | 35/111 [00:23<00:49,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9465, LAS: 0.9008, UEM: 0.5095, LEM: 0.2718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2651, partial_loss/deprel_loss: 0.4027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5487, loss: 0.7180, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  35%|###5      | 39/111 [00:25<00:46,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9450, LAS: 0.8992, UEM: 0.5146, LEM: 0.2811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3986, partial_loss/deprel_loss: 0.8601, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1413, loss: 0.7268, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  39%|###8      | 43/111 [00:28<00:46,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9453, LAS: 0.8996, UEM: 0.5111, LEM: 0.2752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7778, partial_loss/deprel_loss: 0.7009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8898, loss: 0.7258, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  42%|####2     | 47/111 [00:31<00:42,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9460, LAS: 0.9001, UEM: 0.5274, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1283, partial_loss/deprel_loss: 0.2925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4332, loss: 0.7209, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  45%|####5     | 50/111 [00:33<00:41,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9331, UAS: 0.9465, LAS: 0.9009, UEM: 0.5576, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1901, partial_loss/deprel_loss: 0.3367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4808, loss: 0.7148, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  48%|####7     | 53/111 [00:35<00:41,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9470, LAS: 0.9016, UEM: 0.5619, LEM: 0.3321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4573, partial_loss/deprel_loss: 0.5106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6734, loss: 0.7086, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  50%|#####     | 56/111 [00:38<00:40,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9478, LAS: 0.9026, UEM: 0.5709, LEM: 0.3398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2196, partial_loss/deprel_loss: 0.3034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4601, loss: 0.7010, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  53%|#####3    | 59/111 [00:40<00:40,  1.29it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9478, LAS: 0.9028, UEM: 0.5694, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3711, partial_loss/deprel_loss: 0.4710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6245, loss: 0.6999, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  56%|#####5    | 62/111 [00:42<00:36,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9477, LAS: 0.9025, UEM: 0.5648, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9499, partial_loss/deprel_loss: 0.7206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9399, loss: 0.7035, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  59%|#####8    | 65/111 [00:44<00:33,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9478, LAS: 0.9026, UEM: 0.5617, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7457, partial_loss/deprel_loss: 0.7231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9010, loss: 0.7022, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  62%|######2   | 69/111 [00:47<00:29,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8668, UAS: 0.9464, LAS: 0.9012, UEM: 0.5578, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0939, partial_loss/deprel_loss: 0.8407, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0648, loss: 0.7157, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  65%|######4   | 72/111 [00:49<00:27,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9469, LAS: 0.9017, UEM: 0.5644, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5945, partial_loss/deprel_loss: 0.5757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7529, loss: 0.7114, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  68%|######7   | 75/111 [00:51<00:25,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9467, LAS: 0.9014, UEM: 0.5578, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6574, partial_loss/deprel_loss: 0.6179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7992, loss: 0.7137, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9470, LAS: 0.9017, UEM: 0.5695, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5613, partial_loss/deprel_loss: 0.5691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7409, loss: 0.7098, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9473, LAS: 0.9019, UEM: 0.5681, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3195, partial_loss/deprel_loss: 0.4217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5746, loss: 0.7095, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  78%|#######8  | 87/111 [00:59<00:16,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9471, LAS: 0.9017, UEM: 0.5661, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4214, partial_loss/deprel_loss: 0.4737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6366, loss: 0.7102, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  82%|########1 | 91/111 [01:01<00:12,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8424, UAS: 0.9471, LAS: 0.9017, UEM: 0.5694, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3132, partial_loss/deprel_loss: 0.8401, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1081, loss: 0.7094, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  86%|########5 | 95/111 [01:04<00:10,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9467, LAS: 0.9015, UEM: 0.5678, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4053, partial_loss/deprel_loss: 0.4962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6514, loss: 0.7116, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  89%|########9 | 99/111 [01:07<00:07,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9472, LAS: 0.9019, UEM: 0.5759, LEM: 0.3360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1922, partial_loss/deprel_loss: 0.3905, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5242, loss: 0.7089, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  93%|#########2| 103/111 [01:10<00:05,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8366, UAS: 0.9472, LAS: 0.9020, UEM: 0.5894, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3455, partial_loss/deprel_loss: 1.0114, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2516, loss: 0.7093, batch_reg_loss: 0.1733, reg_loss: 0.1735 ||:  95%|#########5| 106/111 [01:12<00:03,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.9473, LAS: 0.9022, UEM: 0.5902, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0149, partial_loss/deprel_loss: 0.6764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9174, loss: 0.7074, batch_reg_loss: 0.1733, reg_loss: 0.1735 ||:  99%|#########9| 110/111 [01:14<00:00,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9474, LAS: 0.9022, UEM: 0.5892, LEM: 0.3539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5141, partial_loss/deprel_loss: 0.4841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6635, loss: 0.7070, batch_reg_loss: 0.1733, reg_loss: 0.1735 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
+      "2023-04-07 00:31:33,915 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8312, UAS: 0.9126, LAS: 0.8528, UEM: 0.2678, LEM: 0.0820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5891, partial_loss/deprel_loss: 57.0978, partial_loss/cycle_loss: 0.0000, batch_loss: 45.9961, loss: 35.5607, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.04s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9458, LAS: 0.8918, UEM: 0.6731, LEM: 0.3689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4201, partial_loss/deprel_loss: 24.8719, partial_loss/cycle_loss: 0.0000, batch_loss: 19.9815, loss: 26.3380, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:08,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8755, UAS: 0.9447, LAS: 0.8922, UEM: 0.6285, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0363, partial_loss/deprel_loss: 36.5851, partial_loss/cycle_loss: 0.0000, batch_loss: 29.4754, loss: 26.2771, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9436, LAS: 0.8913, UEM: 0.6011, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5407, partial_loss/deprel_loss: 24.4729, partial_loss/cycle_loss: 0.0000, batch_loss: 19.6864, loss: 26.8626, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:09<00:02,  1.02it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9466, LAS: 0.8953, UEM: 0.6564, LEM: 0.3961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1730, partial_loss/deprel_loss: 20.4255, partial_loss/cycle_loss: 0.0000, batch_loss: 16.3750, loss: 25.7702, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9464, LAS: 0.8949, UEM: 0.6475, LEM: 0.3824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6519, partial_loss/deprel_loss: 34.6901, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8825, loss: 25.9327, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.04it/s]\n",
+      "2023-04-07 00:31:46,420 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.484  |    34.690\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.514  |     0.652\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |     0.000\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - UEM                      |     0.589  |     0.648\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - LAS                      |     0.902  |     0.895\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - loss                     |     0.707  |    25.933\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - LEM                      |     0.354  |     0.382\n",
+      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - UAS                      |     0.947  |     0.946\n",
+      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - EM                       |     0.907  |     0.890\n",
+      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:31:46,427 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:31:51,593 - INFO - combo.training.trainer - Epoch duration: 0:01:35.977183\n",
+      "2023-04-07 00:31:51,595 - INFO - combo.training.trainer - Estimated training time remaining: 7:15:08\n",
+      "2023-04-07 00:31:51,595 - INFO - allennlp.training.trainer - Epoch 76/399\n",
+      "2023-04-07 00:31:51,595 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:31:51,596 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:31:51,605 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9347, LAS: 0.8909, UEM: 0.5095, LEM: 0.2695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2675, partial_loss/deprel_loss: 0.8097, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0746, loss: 0.7894, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:   4%|3         | 4/111 [00:02<01:09,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8760, UAS: 0.9366, LAS: 0.8924, UEM: 0.3993, LEM: 0.1864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9186, partial_loss/deprel_loss: 0.7514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9581, loss: 0.7899, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:   7%|7         | 8/111 [00:05<01:05,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9376, LAS: 0.8935, UEM: 0.3859, LEM: 0.1759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6642, partial_loss/deprel_loss: 0.6574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8321, loss: 0.7815, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  10%|9         | 11/111 [00:07<01:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9429, LAS: 0.8999, UEM: 0.5021, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1660, partial_loss/deprel_loss: 0.3516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.7301, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  13%|#2        | 14/111 [00:09<01:07,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9421, LAS: 0.8981, UEM: 0.4642, LEM: 0.2499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5952, partial_loss/deprel_loss: 0.5753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7526, loss: 0.7337, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  16%|#6        | 18/111 [00:12<01:03,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9433, LAS: 0.8993, UEM: 0.4622, LEM: 0.2416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7205, partial_loss/deprel_loss: 0.6275, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8194, loss: 0.7294, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  19%|#8        | 21/111 [00:14<01:01,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9412, LAS: 0.8971, UEM: 0.4414, LEM: 0.2264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5751, partial_loss/deprel_loss: 0.5682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7429, loss: 0.7399, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  22%|##1       | 24/111 [00:16<00:59,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9438, LAS: 0.9003, UEM: 0.4829, LEM: 0.2618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1826, partial_loss/deprel_loss: 0.2829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4361, loss: 0.7217, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  25%|##5       | 28/111 [00:18<00:53,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9451, LAS: 0.9016, UEM: 0.5168, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6928, partial_loss/deprel_loss: 0.6290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8150, loss: 0.7092, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  28%|##7       | 31/111 [00:20<00:56,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9432, LAS: 0.8997, UEM: 0.5206, LEM: 0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7606, partial_loss/deprel_loss: 0.6660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8582, loss: 0.7262, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  31%|###       | 34/111 [00:23<00:55,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9443, LAS: 0.9008, UEM: 0.5325, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2798, partial_loss/deprel_loss: 0.3900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5412, loss: 0.7177, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  33%|###3      | 37/111 [00:25<00:52,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9536, UAS: 0.9462, LAS: 0.9029, UEM: 0.5708, LEM: 0.3511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0746, partial_loss/deprel_loss: 0.1974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3461, loss: 0.7017, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  36%|###6      | 40/111 [00:27<00:49,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9462, LAS: 0.9027, UEM: 0.5641, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3328, partial_loss/deprel_loss: 0.4941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6351, loss: 0.7032, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  39%|###8      | 43/111 [00:29<00:48,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8922, UAS: 0.9468, LAS: 0.9032, UEM: 0.5601, LEM: 0.3345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5435, partial_loss/deprel_loss: 0.6927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8361, loss: 0.7015, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  42%|####2     | 47/111 [00:32<00:44,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9467, LAS: 0.9027, UEM: 0.5492, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4341, partial_loss/deprel_loss: 0.5543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7035, loss: 0.7062, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  45%|####5     | 50/111 [00:34<00:41,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9462, LAS: 0.9021, UEM: 0.5426, LEM: 0.3180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0915, partial_loss/deprel_loss: 0.7196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9672, loss: 0.7087, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  49%|####8     | 54/111 [00:36<00:37,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9460, LAS: 0.9020, UEM: 0.5445, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1289, partial_loss/deprel_loss: 0.2808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4237, loss: 0.7099, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  52%|#####2    | 58/111 [00:39<00:34,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8858, UAS: 0.9462, LAS: 0.9021, UEM: 0.5429, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7801, partial_loss/deprel_loss: 0.6634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8600, loss: 0.7097, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  56%|#####5    | 62/111 [00:42<00:33,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9451, LAS: 0.9010, UEM: 0.5357, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4855, partial_loss/deprel_loss: 0.4707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6469, loss: 0.7182, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  59%|#####8    | 65/111 [00:44<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9461, LAS: 0.9021, UEM: 0.5474, LEM: 0.3176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.3456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4927, loss: 0.7102, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  61%|######1   | 68/111 [00:46<00:30,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9467, LAS: 0.9027, UEM: 0.5512, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1928, partial_loss/deprel_loss: 0.3655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5042, loss: 0.7054, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  65%|######4   | 72/111 [00:49<00:27,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9475, LAS: 0.9035, UEM: 0.5626, LEM: 0.3277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2363, partial_loss/deprel_loss: 0.3691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5158, loss: 0.6985, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  68%|######7   | 75/111 [00:51<00:24,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9473, LAS: 0.9034, UEM: 0.5586, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8980, partial_loss/deprel_loss: 0.7342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9401, loss: 0.7008, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  72%|#######2  | 80/111 [00:53<00:19,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9467, LAS: 0.9025, UEM: 0.5626, LEM: 0.3271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0960, partial_loss/deprel_loss: 0.3072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4381, loss: 0.7070, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  76%|#######5  | 84/111 [00:56<00:17,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9468, LAS: 0.9025, UEM: 0.5600, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2817, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5759, loss: 0.7073, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  79%|#######9  | 88/111 [00:59<00:15,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9472, LAS: 0.9029, UEM: 0.5658, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2821, partial_loss/deprel_loss: 0.4354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5779, loss: 0.7038, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  83%|########2 | 92/111 [01:02<00:13,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9481, LAS: 0.9040, UEM: 0.5924, LEM: 0.3602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1210, partial_loss/deprel_loss: 0.2562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4023, loss: 0.6952, batch_reg_loss: 0.1732, reg_loss: 0.1732 ||:  86%|########5 | 95/111 [01:05<00:12,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9480, LAS: 0.9038, UEM: 0.5892, LEM: 0.3560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3368, partial_loss/deprel_loss: 0.5038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6435, loss: 0.6965, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||:  89%|########9 | 99/111 [01:07<00:08,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9482, LAS: 0.9040, UEM: 0.5977, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1306, partial_loss/deprel_loss: 0.2463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3963, loss: 0.6941, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||:  92%|#########1| 102/111 [01:10<00:06,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9480, LAS: 0.9038, UEM: 0.5968, LEM: 0.3653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9104, partial_loss/deprel_loss: 0.7103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9235, loss: 0.6946, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||:  95%|#########4| 105/111 [01:12<00:04,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9480, LAS: 0.9037, UEM: 0.5927, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5892, partial_loss/deprel_loss: 0.6759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8316, loss: 0.6965, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||:  98%|#########8| 109/111 [01:14<00:01,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9473, LAS: 0.9031, UEM: 0.5895, LEM: 0.3579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4323, partial_loss/deprel_loss: 0.8211, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1164, loss: 0.7008, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.821  |       N/A\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.432  |       N/A\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |       N/A\n",
+      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - UEM                      |     0.590  |       N/A\n",
+      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - LAS                      |     0.903  |       N/A\n",
+      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - loss                     |     0.701  |       N/A\n",
+      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - LEM                      |     0.358  |       N/A\n",
+      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - UAS                      |     0.947  |       N/A\n",
+      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - EM                       |     0.842  |       N/A\n",
+      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:33:10,837 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:33:15,301 - INFO - combo.training.trainer - Epoch duration: 0:01:23.706250\n",
+      "2023-04-07 00:33:15,302 - INFO - combo.training.trainer - Estimated training time remaining: 7:14:01\n",
+      "2023-04-07 00:33:15,302 - INFO - allennlp.training.trainer - Epoch 77/399\n",
+      "2023-04-07 00:33:15,302 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:33:15,303 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:33:15,313 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9540, LAS: 0.9091, UEM: 0.4911, LEM: 0.2216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3272, partial_loss/deprel_loss: 0.4489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5977, loss: 0.6525, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:   4%|3         | 4/111 [00:02<01:08,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9550, LAS: 0.9096, UEM: 0.5444, LEM: 0.2853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1937, partial_loss/deprel_loss: 0.3571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4976, loss: 0.6352, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:   6%|6         | 7/111 [00:04<01:10,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9568, LAS: 0.9127, UEM: 0.6099, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3553, partial_loss/deprel_loss: 0.4601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6122, loss: 0.6160, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:   9%|9         | 10/111 [00:06<01:08,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9545, LAS: 0.9111, UEM: 0.5946, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4713, partial_loss/deprel_loss: 0.5090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6746, loss: 0.6297, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  12%|#1        | 13/111 [00:09<01:08,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9542, LAS: 0.9106, UEM: 0.5909, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3604, partial_loss/deprel_loss: 0.4224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5831, loss: 0.6357, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  14%|#4        | 16/111 [00:11<01:07,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9499, LAS: 0.9057, UEM: 0.5877, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5063, partial_loss/deprel_loss: 0.5628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7246, loss: 0.6704, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  17%|#7        | 19/111 [00:13<01:07,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9477, LAS: 0.9023, UEM: 0.5584, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7295, partial_loss/deprel_loss: 0.6436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8338, loss: 0.6924, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  20%|#9        | 22/111 [00:15<01:04,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9458, LAS: 0.9005, UEM: 0.5394, LEM: 0.3091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4192, partial_loss/deprel_loss: 0.4877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6471, loss: 0.7056, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  23%|##2       | 25/111 [00:18<01:03,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9491, LAS: 0.9041, UEM: 0.5924, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2642, partial_loss/deprel_loss: 0.3273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.6803, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  25%|##5       | 28/111 [00:20<00:59,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9486, LAS: 0.9040, UEM: 0.5864, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5366, partial_loss/deprel_loss: 0.5191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6956, loss: 0.6813, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  28%|##7       | 31/111 [00:22<00:56,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9480, LAS: 0.9034, UEM: 0.5770, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.4163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5606, loss: 0.6854, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  32%|###1      | 35/111 [00:24<00:52,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9487, LAS: 0.9038, UEM: 0.5780, LEM: 0.3365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2471, partial_loss/deprel_loss: 0.4322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5682, loss: 0.6814, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  34%|###4      | 38/111 [00:26<00:50,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9490, LAS: 0.9041, UEM: 0.5731, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5803, partial_loss/deprel_loss: 0.6454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8054, loss: 0.6820, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  37%|###6      | 41/111 [00:29<00:49,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9311, UAS: 0.9507, LAS: 0.9061, UEM: 0.5970, LEM: 0.3520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2123, partial_loss/deprel_loss: 0.3388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4865, loss: 0.6680, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  40%|###9      | 44/111 [00:31<00:47,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9510, LAS: 0.9065, UEM: 0.5949, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5873, partial_loss/deprel_loss: 0.5985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7692, loss: 0.6658, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  42%|####2     | 47/111 [00:33<00:46,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9517, LAS: 0.9072, UEM: 0.6124, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.3660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.6589, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  45%|####5     | 50/111 [00:35<00:45,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9068, UAS: 0.9508, LAS: 0.9060, UEM: 0.6017, LEM: 0.3565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3449, partial_loss/deprel_loss: 0.5163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6550, loss: 0.6699, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  49%|####8     | 54/111 [00:38<00:40,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9676, UAS: 0.9505, LAS: 0.9062, UEM: 0.6242, LEM: 0.3916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0425, partial_loss/deprel_loss: 0.1334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2883, loss: 0.6690, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  51%|#####1    | 57/111 [00:41<00:42,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9501, LAS: 0.9056, UEM: 0.6222, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3604, partial_loss/deprel_loss: 0.4116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5743, loss: 0.6729, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  55%|#####4    | 61/111 [00:43<00:36,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9498, LAS: 0.9051, UEM: 0.6129, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6639, partial_loss/deprel_loss: 0.6474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8237, loss: 0.6772, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  58%|#####7    | 64/111 [00:45<00:33,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9495, LAS: 0.9047, UEM: 0.6096, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3216, partial_loss/deprel_loss: 0.4934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6320, loss: 0.6809, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  60%|######    | 67/111 [00:48<00:32,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9498, LAS: 0.9050, UEM: 0.6106, LEM: 0.3777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1373, partial_loss/deprel_loss: 0.2911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4333, loss: 0.6803, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  63%|######3   | 70/111 [00:50<00:29,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9489, LAS: 0.9041, UEM: 0.6022, LEM: 0.3710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4646, partial_loss/deprel_loss: 0.4755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6463, loss: 0.6865, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  66%|######5   | 73/111 [00:52<00:28,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9492, LAS: 0.9046, UEM: 0.6020, LEM: 0.3689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3846, partial_loss/deprel_loss: 0.5038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.6829, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  68%|######8   | 76/111 [00:54<00:26,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.9493, LAS: 0.9047, UEM: 0.5995, LEM: 0.3650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0225, partial_loss/deprel_loss: 0.7170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9511, loss: 0.6818, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  72%|#######2  | 80/111 [00:57<00:21,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9496, LAS: 0.9049, UEM: 0.5995, LEM: 0.3628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3052, partial_loss/deprel_loss: 0.4495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5936, loss: 0.6812, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  75%|#######4  | 83/111 [00:59<00:20,  1.39it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9490, LAS: 0.9043, UEM: 0.5976, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9099, partial_loss/deprel_loss: 0.7320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9406, loss: 0.6865, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  78%|#######8  | 87/111 [01:02<00:16,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9490, LAS: 0.9044, UEM: 0.5949, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3954, partial_loss/deprel_loss: 0.4187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5870, loss: 0.6859, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  81%|########1 | 90/111 [01:06<00:20,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9494, LAS: 0.9049, UEM: 0.6072, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0955, partial_loss/deprel_loss: 0.2082, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3586, loss: 0.6819, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  84%|########3 | 93/111 [01:09<00:17,  1.06it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8814, UAS: 0.9491, LAS: 0.9046, UEM: 0.6034, LEM: 0.3721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7977, partial_loss/deprel_loss: 0.6350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8405, loss: 0.6841, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  86%|########6 | 96/111 [01:11<00:13,  1.15it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9492, LAS: 0.9047, UEM: 0.6042, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2056, partial_loss/deprel_loss: 0.3270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4756, loss: 0.6822, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  89%|########9 | 99/111 [01:13<00:09,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9485, LAS: 0.9039, UEM: 0.5998, LEM: 0.3694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6815, partial_loss/deprel_loss: 0.5970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7868, loss: 0.6867, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  92%|#########1| 102/111 [01:15<00:07,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8910, UAS: 0.9487, LAS: 0.9040, UEM: 0.5997, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6866, partial_loss/deprel_loss: 0.6442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8256, loss: 0.6861, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  95%|#########4| 105/111 [01:18<00:04,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9485, LAS: 0.9037, UEM: 0.5933, LEM: 0.3618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8087, partial_loss/deprel_loss: 0.8120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9843, loss: 0.6896, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  98%|#########8| 109/111 [01:20<00:01,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9480, LAS: 0.9032, UEM: 0.5896, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0166, partial_loss/deprel_loss: 0.6683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9109, loss: 0.6941, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||: 100%|##########| 111/111 [01:21<00:00,  1.35it/s]\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.668  |       N/A\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.017  |       N/A\n",
+      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |       N/A\n",
+      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - UEM                      |     0.590  |       N/A\n",
+      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - LAS                      |     0.903  |       N/A\n",
+      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - loss                     |     0.694  |       N/A\n",
+      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - LEM                      |     0.359  |       N/A\n",
+      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - UAS                      |     0.948  |       N/A\n",
+      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - EM                       |     0.875  |       N/A\n",
+      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:34:40,196 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:34:44,979 - INFO - combo.training.trainer - Epoch duration: 0:01:29.676969\n",
+      "2023-04-07 00:34:44,980 - INFO - combo.training.trainer - Estimated training time remaining: 7:13:18\n",
+      "2023-04-07 00:34:44,980 - INFO - allennlp.training.trainer - Epoch 78/399\n",
+      "2023-04-07 00:34:44,980 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:34:44,981 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:34:44,988 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9679, LAS: 0.9231, UEM: 0.7181, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3375, partial_loss/deprel_loss: 0.3727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5386, loss: 0.5293, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:   3%|2         | 3/111 [00:02<01:15,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9566, LAS: 0.9133, UEM: 0.6358, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6508, partial_loss/deprel_loss: 0.6221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8007, loss: 0.6167, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:   5%|5         | 6/111 [00:04<01:13,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9543, LAS: 0.9101, UEM: 0.6182, LEM: 0.3409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3246, partial_loss/deprel_loss: 0.4870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6274, loss: 0.6452, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9486, LAS: 0.9035, UEM: 0.5601, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8651, partial_loss/deprel_loss: 0.6585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8727, loss: 0.6916, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  12%|#1        | 13/111 [00:08<01:07,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9496, LAS: 0.9042, UEM: 0.5650, LEM: 0.2982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5894, partial_loss/deprel_loss: 0.5549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.6833, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  14%|#4        | 16/111 [00:11<01:06,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9507, LAS: 0.9051, UEM: 0.5807, LEM: 0.3174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5727, partial_loss/deprel_loss: 0.6267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7888, loss: 0.6759, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  17%|#7        | 19/111 [00:13<01:07,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9504, LAS: 0.9054, UEM: 0.5797, LEM: 0.3181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5428, partial_loss/deprel_loss: 0.5371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7111, loss: 0.6827, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  20%|#9        | 22/111 [00:15<01:05,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9482, LAS: 0.9033, UEM: 0.5805, LEM: 0.3326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2453, partial_loss/deprel_loss: 0.8579, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1083, loss: 0.6936, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  23%|##2       | 25/111 [00:17<01:03,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9480, LAS: 0.9034, UEM: 0.5686, LEM: 0.3231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7153, partial_loss/deprel_loss: 0.5758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7766, loss: 0.6925, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  25%|##5       | 28/111 [00:20<01:03,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9483, LAS: 0.9041, UEM: 0.5652, LEM: 0.3186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2857, partial_loss/deprel_loss: 0.3994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5495, loss: 0.6867, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  28%|##7       | 31/111 [00:22<01:02,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9485, LAS: 0.9044, UEM: 0.5621, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0274, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0280, loss: 0.6880, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  32%|###1      | 35/111 [00:25<00:54,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9465, LAS: 0.9023, UEM: 0.5479, LEM: 0.3012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8060, partial_loss/deprel_loss: 0.7816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9593, loss: 0.7045, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  35%|###5      | 39/111 [00:27<00:50,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9456, LAS: 0.9013, UEM: 0.5402, LEM: 0.2945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5544, partial_loss/deprel_loss: 0.6268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7852, loss: 0.7115, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  38%|###7      | 42/111 [00:29<00:47,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9461, LAS: 0.9019, UEM: 0.5449, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7151, partial_loss/deprel_loss: 0.7046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8796, loss: 0.7092, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  41%|####      | 45/111 [00:31<00:45,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9474, LAS: 0.9031, UEM: 0.5644, LEM: 0.3191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5186, partial_loss/deprel_loss: 0.6419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7901, loss: 0.7012, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  43%|####3     | 48/111 [00:34<00:45,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9469, LAS: 0.9025, UEM: 0.5606, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8224, partial_loss/deprel_loss: 0.6433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8520, loss: 0.7051, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  47%|####6     | 52/111 [00:36<00:40,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9475, LAS: 0.9031, UEM: 0.5585, LEM: 0.3156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2593, partial_loss/deprel_loss: 0.3815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5299, loss: 0.7007, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  50%|####9     | 55/111 [00:38<00:39,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9470, LAS: 0.9024, UEM: 0.5479, LEM: 0.3069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4642, partial_loss/deprel_loss: 0.5490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7049, loss: 0.7073, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  53%|#####3    | 59/111 [00:41<00:34,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9475, LAS: 0.9030, UEM: 0.5552, LEM: 0.3137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4942, partial_loss/deprel_loss: 0.5451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7077, loss: 0.7039, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  57%|#####6    | 63/111 [00:43<00:32,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9472, LAS: 0.9028, UEM: 0.5517, LEM: 0.3139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3959, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6006, loss: 0.7036, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  60%|######    | 67/111 [00:46<00:30,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9478, LAS: 0.9035, UEM: 0.5566, LEM: 0.3166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2160, partial_loss/deprel_loss: 0.3595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5036, loss: 0.6997, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  64%|######3   | 71/111 [00:49<00:27,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9476, LAS: 0.9032, UEM: 0.5699, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0714, partial_loss/deprel_loss: 0.2042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3505, loss: 0.7030, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  67%|######6   | 74/111 [00:51<00:25,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9465, LAS: 0.9023, UEM: 0.5679, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8180, partial_loss/deprel_loss: 0.6136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8273, loss: 0.7098, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  69%|######9   | 77/111 [00:54<00:24,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9465, LAS: 0.9021, UEM: 0.5639, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6078, partial_loss/deprel_loss: 0.6108, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7830, loss: 0.7105, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  73%|#######2  | 81/111 [00:56<00:21,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9470, LAS: 0.9028, UEM: 0.5722, LEM: 0.3391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1430, partial_loss/deprel_loss: 0.2524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4033, loss: 0.7049, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  76%|#######5  | 84/111 [00:58<00:19,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9474, LAS: 0.9034, UEM: 0.5887, LEM: 0.3620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6315, partial_loss/deprel_loss: 0.6066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7844, loss: 0.6999, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  78%|#######8  | 87/111 [01:01<00:17,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9481, LAS: 0.9040, UEM: 0.5977, LEM: 0.3680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.4475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5810, loss: 0.6947, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  81%|########1 | 90/111 [01:03<00:15,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9479, LAS: 0.9036, UEM: 0.5902, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6856, partial_loss/deprel_loss: 0.5673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7637, loss: 0.6968, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  85%|########4 | 94/111 [01:06<00:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9479, LAS: 0.9038, UEM: 0.5882, LEM: 0.3587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3477, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6485, loss: 0.6960, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  87%|########7 | 97/111 [01:08<00:10,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9475, LAS: 0.9035, UEM: 0.5840, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6664, partial_loss/deprel_loss: 0.5377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7362, loss: 0.6976, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  90%|######### | 100/111 [01:10<00:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9480, LAS: 0.9041, UEM: 0.5887, LEM: 0.3604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1575, partial_loss/deprel_loss: 0.2746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4240, loss: 0.6932, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  94%|#########3| 104/111 [01:13<00:04,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9486, LAS: 0.9047, UEM: 0.5946, LEM: 0.3647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2394, partial_loss/deprel_loss: 0.3851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5287, loss: 0.6893, batch_reg_loss: 0.1728, reg_loss: 0.1728 ||:  96%|#########6| 107/111 [01:15<00:02,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9489, LAS: 0.9049, UEM: 0.5942, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6411, partial_loss/deprel_loss: 0.6306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8055, loss: 0.6882, batch_reg_loss: 0.1728, reg_loss: 0.1728 ||:  99%|#########9| 110/111 [01:17<00:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9489, LAS: 0.9048, UEM: 0.5932, LEM: 0.3620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4630, partial_loss/deprel_loss: 0.6202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7615, loss: 0.6888, batch_reg_loss: 0.1728, reg_loss: 0.1728 ||: 100%|##########| 111/111 [01:18<00:00,  1.42it/s]\n",
+      "2023-04-07 00:36:06,576 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.620  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.463  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - UEM                      |     0.593  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - LAS                      |     0.905  |       N/A\n",
+      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - loss                     |     0.689  |       N/A\n",
+      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - LEM                      |     0.362  |       N/A\n",
+      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - UAS                      |     0.949  |       N/A\n",
+      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - EM                       |     0.898  |       N/A\n",
+      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:36:06,583 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:36:11,692 - INFO - combo.training.trainer - Epoch duration: 0:01:26.712266\n",
+      "2023-04-07 00:36:11,693 - INFO - combo.training.trainer - Estimated training time remaining: 7:12:21\n",
+      "2023-04-07 00:36:11,693 - INFO - allennlp.training.trainer - Epoch 79/399\n",
+      "2023-04-07 00:36:11,693 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:36:11,693 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:36:11,701 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9323, UAS: 0.9567, LAS: 0.9180, UEM: 0.5695, LEM: 0.3250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2451, partial_loss/deprel_loss: 0.4015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5430, loss: 0.6235, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:   4%|3         | 4/111 [00:02<01:09,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8239, UAS: 0.9426, LAS: 0.9010, UEM: 0.4922, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7117, partial_loss/deprel_loss: 1.0595, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3627, loss: 0.7478, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:   7%|7         | 8/111 [00:05<01:08,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9500, LAS: 0.9082, UEM: 0.6338, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3560, partial_loss/deprel_loss: 0.5119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6534, loss: 0.6912, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  10%|9         | 11/111 [00:07<01:08,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9476, LAS: 0.9051, UEM: 0.5838, LEM: 0.3653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3645, partial_loss/deprel_loss: 0.4990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6448, loss: 0.7086, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  14%|#3        | 15/111 [00:10<01:04,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9468, LAS: 0.9040, UEM: 0.5621, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3119, partial_loss/deprel_loss: 0.4127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5653, loss: 0.7126, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  16%|#6        | 18/111 [00:12<01:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9495, LAS: 0.9071, UEM: 0.6012, LEM: 0.3786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1973, partial_loss/deprel_loss: 0.3137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4632, loss: 0.6835, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  19%|#8        | 21/111 [00:14<01:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9512, LAS: 0.9097, UEM: 0.6573, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7300, partial_loss/deprel_loss: 0.6385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8295, loss: 0.6655, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  22%|##1       | 24/111 [00:16<01:02,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9152, UAS: 0.9509, LAS: 0.9091, UEM: 0.6380, LEM: 0.4309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3313, partial_loss/deprel_loss: 0.4382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5895, loss: 0.6719, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  25%|##5       | 28/111 [00:19<00:57,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9527, LAS: 0.9108, UEM: 0.6429, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2971, partial_loss/deprel_loss: 0.4320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5777, loss: 0.6572, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  29%|##8       | 32/111 [00:21<00:51,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9526, LAS: 0.9103, UEM: 0.6318, LEM: 0.4139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3001, partial_loss/deprel_loss: 0.4517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5941, loss: 0.6554, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  32%|###1      | 35/111 [00:23<00:50,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8422, UAS: 0.9514, LAS: 0.9086, UEM: 0.6262, LEM: 0.4088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2311, partial_loss/deprel_loss: 0.8674, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1128, loss: 0.6664, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  34%|###4      | 38/111 [00:25<00:49,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9524, LAS: 0.9097, UEM: 0.6317, LEM: 0.4082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2377, partial_loss/deprel_loss: 0.3761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5211, loss: 0.6570, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  37%|###6      | 41/111 [00:27<00:48,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9507, LAS: 0.9078, UEM: 0.6229, LEM: 0.4022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1997, partial_loss/deprel_loss: 0.3551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4966, loss: 0.6716, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  41%|####      | 45/111 [00:30<00:45,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9501, LAS: 0.9073, UEM: 0.6259, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1513, partial_loss/deprel_loss: 0.2561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4078, loss: 0.6734, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  44%|####4     | 49/111 [00:33<00:43,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9506, LAS: 0.9077, UEM: 0.6257, LEM: 0.4059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5370, partial_loss/deprel_loss: 0.5998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7598, loss: 0.6716, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  47%|####6     | 52/111 [00:35<00:41,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9509, LAS: 0.9082, UEM: 0.6271, LEM: 0.4067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.2975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4542, loss: 0.6671, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  50%|#####     | 56/111 [00:38<00:38,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9504, LAS: 0.9075, UEM: 0.6145, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5854, partial_loss/deprel_loss: 0.5008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6903, loss: 0.6702, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  54%|#####4    | 60/111 [00:40<00:33,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9511, LAS: 0.9083, UEM: 0.6169, LEM: 0.3916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3994, partial_loss/deprel_loss: 0.4495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6121, loss: 0.6644, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  58%|#####7    | 64/111 [00:43<00:32,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9515, LAS: 0.9084, UEM: 0.6153, LEM: 0.3867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2341, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5563, loss: 0.6629, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  60%|######    | 67/111 [00:45<00:30,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8708, UAS: 0.9511, LAS: 0.9079, UEM: 0.6110, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8882, partial_loss/deprel_loss: 0.7016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9115, loss: 0.6672, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  63%|######3   | 70/111 [00:48<00:29,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9509, LAS: 0.9078, UEM: 0.6095, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1806, partial_loss/deprel_loss: 0.3297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4725, loss: 0.6690, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  66%|######5   | 73/111 [00:50<00:27,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9505, LAS: 0.9071, UEM: 0.6078, LEM: 0.3788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2898, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5766, loss: 0.6730, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  69%|######9   | 77/111 [00:52<00:23,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9508, LAS: 0.9073, UEM: 0.6133, LEM: 0.3822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1380, partial_loss/deprel_loss: 0.3113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4492, loss: 0.6704, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  72%|#######2  | 80/111 [00:54<00:21,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9498, LAS: 0.9063, UEM: 0.6056, LEM: 0.3753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5038, partial_loss/deprel_loss: 0.9507, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2339, loss: 0.6799, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  76%|#######5  | 84/111 [00:57<00:18,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9499, LAS: 0.9062, UEM: 0.6077, LEM: 0.3767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6644, partial_loss/deprel_loss: 0.6769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8469, loss: 0.6789, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  78%|#######8  | 87/111 [00:59<00:16,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9496, LAS: 0.9058, UEM: 0.6070, LEM: 0.3774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7890, partial_loss/deprel_loss: 0.8387, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0013, loss: 0.6827, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  81%|########1 | 90/111 [01:01<00:14,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9486, LAS: 0.9046, UEM: 0.5989, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4162, partial_loss/deprel_loss: 0.5504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6961, loss: 0.6908, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  85%|########4 | 94/111 [01:04<00:11,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9480, LAS: 0.9039, UEM: 0.5931, LEM: 0.3646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6230, partial_loss/deprel_loss: 0.6034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7799, loss: 0.6954, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  88%|########8 | 98/111 [01:07<00:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9481, LAS: 0.9041, UEM: 0.5966, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8358, partial_loss/deprel_loss: 0.7337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9267, loss: 0.6936, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  91%|######### | 101/111 [01:09<00:07,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9480, LAS: 0.9040, UEM: 0.5914, LEM: 0.3628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4340, partial_loss/deprel_loss: 0.4662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6323, loss: 0.6934, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  95%|#########4| 105/111 [01:11<00:04,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9478, LAS: 0.9037, UEM: 0.5856, LEM: 0.3578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8297, partial_loss/deprel_loss: 0.6664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8716, loss: 0.6959, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  98%|#########8| 109/111 [01:14<00:01,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9479, LAS: 0.9038, UEM: 0.5869, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7285, partial_loss/deprel_loss: 0.5894, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7897, loss: 0.6951, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
+      "2023-04-07 00:37:30,881 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.589  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.729  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - UEM                      |     0.587  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - LAS                      |     0.904  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - loss                     |     0.695  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - LEM                      |     0.360  |       N/A\n",
+      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - UAS                      |     0.948  |       N/A\n",
+      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - EM                       |     0.889  |       N/A\n",
+      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:37:30,890 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:37:36,892 - INFO - combo.training.trainer - Epoch duration: 0:01:25.198854\n",
+      "2023-04-07 00:37:36,892 - INFO - combo.training.trainer - Estimated training time remaining: 7:11:18\n",
+      "2023-04-07 00:37:36,892 - INFO - allennlp.training.trainer - Epoch 80/399\n",
+      "2023-04-07 00:37:36,893 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:37:36,893 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:37:36,903 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9620, LAS: 0.9237, UEM: 0.6907, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3221, partial_loss/deprel_loss: 0.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5716, loss: 0.5313, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9603, LAS: 0.9177, UEM: 0.6303, LEM: 0.3688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4412, partial_loss/deprel_loss: 0.5262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6817, loss: 0.5811, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:   5%|5         | 6/111 [00:04<01:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9588, LAS: 0.9181, UEM: 0.6741, LEM: 0.4565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7152, partial_loss/deprel_loss: 0.6657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8481, loss: 0.5944, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:   8%|8         | 9/111 [00:06<01:14,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9549, LAS: 0.9129, UEM: 0.6113, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3193, partial_loss/deprel_loss: 0.4733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6149, loss: 0.6329, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  12%|#1        | 13/111 [00:09<01:08,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9546, LAS: 0.9125, UEM: 0.6094, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4229, partial_loss/deprel_loss: 0.4221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5947, loss: 0.6348, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  14%|#4        | 16/111 [00:11<01:08,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9532, LAS: 0.9108, UEM: 0.6202, LEM: 0.4140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9059, partial_loss/deprel_loss: 0.7547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9574, loss: 0.6489, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  17%|#7        | 19/111 [00:13<01:07,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9530, LAS: 0.9100, UEM: 0.6040, LEM: 0.3906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3067, partial_loss/deprel_loss: 0.4951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6299, loss: 0.6532, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  20%|#9        | 22/111 [00:15<01:05,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9490, LAS: 0.9057, UEM: 0.5830, LEM: 0.3724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4699, partial_loss/deprel_loss: 0.5475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7044, loss: 0.6857, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  23%|##2       | 25/111 [00:18<01:03,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9299, UAS: 0.9502, LAS: 0.9070, UEM: 0.5930, LEM: 0.3742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2599, partial_loss/deprel_loss: 0.4180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5588, loss: 0.6773, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  26%|##6       | 29/111 [00:20<00:58,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9518, LAS: 0.9092, UEM: 0.6273, LEM: 0.4061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2288, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5173, loss: 0.6576, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  29%|##8       | 32/111 [00:23<00:57,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9495, LAS: 0.9065, UEM: 0.6101, LEM: 0.3909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4890, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7113, loss: 0.6791, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  32%|###1      | 35/111 [00:25<00:54,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9486, LAS: 0.9054, UEM: 0.6030, LEM: 0.3847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5379, partial_loss/deprel_loss: 0.5874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7500, loss: 0.6869, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  34%|###4      | 38/111 [00:27<00:52,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8247, UAS: 0.9468, LAS: 0.9033, UEM: 0.5977, LEM: 0.3799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7654, partial_loss/deprel_loss: 0.9535, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2883, loss: 0.7037, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  37%|###6      | 41/111 [00:29<00:49,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9469, LAS: 0.9034, UEM: 0.5872, LEM: 0.3688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3795, partial_loss/deprel_loss: 0.3789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5514, loss: 0.7030, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  41%|####      | 45/111 [00:31<00:44,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9462, LAS: 0.9022, UEM: 0.5714, LEM: 0.3543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5592, partial_loss/deprel_loss: 0.6000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7643, loss: 0.7125, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  44%|####4     | 49/111 [00:34<00:40,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9474, LAS: 0.9035, UEM: 0.5757, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3003, partial_loss/deprel_loss: 0.4217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5699, loss: 0.7029, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  48%|####7     | 53/111 [00:37<00:41,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9485, LAS: 0.9047, UEM: 0.5836, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2203, partial_loss/deprel_loss: 0.3744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.6956, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  50%|#####     | 56/111 [00:39<00:39,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9483, LAS: 0.9043, UEM: 0.5866, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1981, partial_loss/deprel_loss: 0.3500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4921, loss: 0.6978, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  53%|#####3    | 59/111 [00:41<00:36,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9490, LAS: 0.9051, UEM: 0.5953, LEM: 0.3652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2126, partial_loss/deprel_loss: 0.3401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4870, loss: 0.6900, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  56%|#####5    | 62/111 [00:44<00:37,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9492, LAS: 0.9052, UEM: 0.5994, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2119, partial_loss/deprel_loss: 0.3785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5176, loss: 0.6883, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  59%|#####8    | 65/111 [00:46<00:34,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9495, LAS: 0.9056, UEM: 0.6049, LEM: 0.3719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1288, partial_loss/deprel_loss: 0.3110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4469, loss: 0.6860, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  61%|######1   | 68/111 [00:48<00:31,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9491, LAS: 0.9052, UEM: 0.6076, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3398, partial_loss/deprel_loss: 0.7577, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0465, loss: 0.6871, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  64%|######3   | 71/111 [00:50<00:29,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9494, LAS: 0.9057, UEM: 0.6087, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2983, partial_loss/deprel_loss: 0.4091, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5593, loss: 0.6846, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  67%|######6   | 74/111 [00:53<00:27,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9496, LAS: 0.9057, UEM: 0.6040, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3739, partial_loss/deprel_loss: 0.5073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.6851, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:  70%|#######   | 78/111 [00:55<00:22,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9496, LAS: 0.9056, UEM: 0.6007, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.4565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.6847, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:  74%|#######3  | 82/111 [00:57<00:19,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9495, LAS: 0.9057, UEM: 0.5956, LEM: 0.3583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4589, partial_loss/deprel_loss: 0.4744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6437, loss: 0.6845, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:  77%|#######6  | 85/111 [01:00<00:18,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9495, LAS: 0.9056, UEM: 0.5939, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2203, partial_loss/deprel_loss: 0.3479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4947, loss: 0.6853, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:  80%|########  | 89/111 [01:02<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9491, LAS: 0.9052, UEM: 0.5858, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7029, partial_loss/deprel_loss: 0.6080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7993, loss: 0.6869, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||:  84%|########3 | 93/111 [01:05<00:11,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9482, LAS: 0.9041, UEM: 0.5799, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9657, partial_loss/deprel_loss: 0.7077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9316, loss: 0.6950, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||:  87%|########7 | 97/111 [01:07<00:09,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9480, LAS: 0.9037, UEM: 0.5733, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5950, partial_loss/deprel_loss: 0.5820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7570, loss: 0.6973, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||:  91%|######### | 101/111 [01:10<00:06,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9483, LAS: 0.9039, UEM: 0.5756, LEM: 0.3389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5457, partial_loss/deprel_loss: 0.6095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7691, loss: 0.6958, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||:  95%|#########4| 105/111 [01:13<00:04,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9485, LAS: 0.9043, UEM: 0.5833, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2313, partial_loss/deprel_loss: 0.3321, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4842, loss: 0.6930, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||:  97%|#########7| 108/111 [01:15<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9487, LAS: 0.9045, UEM: 0.5949, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7318, partial_loss/deprel_loss: 0.6724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8566, loss: 0.6913, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||: 100%|##########| 111/111 [01:17<00:00,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9487, LAS: 0.9045, UEM: 0.5949, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7318, partial_loss/deprel_loss: 0.6724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8566, loss: 0.6913, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
+      "2023-04-07 00:38:57,543 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9029, LAS: 0.8477, UEM: 0.1151, LEM: 0.0144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3311, partial_loss/deprel_loss: 47.7680, partial_loss/cycle_loss: 0.0000, batch_loss: 38.4806, loss: 41.8893, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.09s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9320, LAS: 0.8765, UEM: 0.5111, LEM: 0.2229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5485, partial_loss/deprel_loss: 24.1775, partial_loss/cycle_loss: 0.0000, batch_loss: 19.4517, loss: 30.7239, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:05<00:08,  1.05s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9407, LAS: 0.8871, UEM: 0.6027, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1748, partial_loss/deprel_loss: 23.6009, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9157, loss: 28.3449, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:05,  1.01s/it]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9280, UAS: 0.9430, LAS: 0.8909, UEM: 0.5963, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3954, partial_loss/deprel_loss: 17.4416, partial_loss/cycle_loss: 0.0000, batch_loss: 14.0323, loss: 26.6526, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9458, LAS: 0.8946, UEM: 0.6489, LEM: 0.3860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7757, partial_loss/deprel_loss: 29.8046, partial_loss/cycle_loss: 0.0000, batch_loss: 23.9988, loss: 25.6342, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.06it/s]\n",
+      "2023-04-07 00:39:09,770 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.672  |    29.805\n",
+      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.732  |     0.776\n",
+      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |     0.000\n",
+      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - UEM                      |     0.595  |     0.649\n",
+      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - LAS                      |     0.904  |     0.895\n",
+      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - loss                     |     0.691  |    25.634\n",
+      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - LEM                      |     0.365  |     0.386\n",
+      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - UAS                      |     0.949  |     0.946\n",
+      "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - EM                       |     0.875  |     0.881\n",
+      "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:39:09,780 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:39:14,857 - INFO - combo.training.trainer - Epoch duration: 0:01:37.964569\n",
+      "2023-04-07 00:39:14,858 - INFO - combo.training.trainer - Estimated training time remaining: 7:11:04\n",
+      "2023-04-07 00:39:14,858 - INFO - allennlp.training.trainer - Epoch 81/399\n",
+      "2023-04-07 00:39:14,858 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:39:14,859 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:39:14,868 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9547, LAS: 0.9104, UEM: 0.6792, LEM: 0.4550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5030, partial_loss/deprel_loss: 0.5679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7273, loss: 0.6154, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:   3%|2         | 3/111 [00:02<01:14,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9549, LAS: 0.9128, UEM: 0.7015, LEM: 0.4632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2751, partial_loss/deprel_loss: 0.3782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5299, loss: 0.6082, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:   6%|6         | 7/111 [00:04<01:10,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9524, LAS: 0.9107, UEM: 0.6876, LEM: 0.4629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6333, partial_loss/deprel_loss: 0.6023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7808, loss: 0.6312, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:   9%|9         | 10/111 [00:06<01:09,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9514, LAS: 0.9102, UEM: 0.6589, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4960, partial_loss/deprel_loss: 0.5311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6964, loss: 0.6450, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  12%|#1        | 13/111 [00:08<01:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9522, LAS: 0.9101, UEM: 0.6362, LEM: 0.4087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.4308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5715, loss: 0.6486, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  14%|#4        | 16/111 [00:11<01:10,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9496, LAS: 0.9079, UEM: 0.6037, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4495, partial_loss/deprel_loss: 0.4817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6475, loss: 0.6674, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  17%|#7        | 19/111 [00:13<01:07,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9513, LAS: 0.9092, UEM: 0.6182, LEM: 0.3905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2502, partial_loss/deprel_loss: 0.4057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5469, loss: 0.6559, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  20%|#9        | 22/111 [00:15<01:05,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9502, LAS: 0.9075, UEM: 0.6075, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1735, partial_loss/deprel_loss: 0.3221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4646, loss: 0.6651, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  23%|##2       | 25/111 [00:17<01:02,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9510, LAS: 0.9083, UEM: 0.6091, LEM: 0.3793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1998, partial_loss/deprel_loss: 0.3217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4696, loss: 0.6594, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  25%|##5       | 28/111 [00:20<01:01,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8468, UAS: 0.9499, LAS: 0.9070, UEM: 0.6042, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2352, partial_loss/deprel_loss: 0.7932, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0539, loss: 0.6675, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  28%|##7       | 31/111 [00:22<00:59,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9509, LAS: 0.9084, UEM: 0.6005, LEM: 0.3653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3909, partial_loss/deprel_loss: 0.4168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.6564, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  32%|###1      | 35/111 [00:25<00:54,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9528, LAS: 0.9105, UEM: 0.6227, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2360, partial_loss/deprel_loss: 0.3608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5081, loss: 0.6427, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  34%|###4      | 38/111 [00:27<00:52,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9514, LAS: 0.9089, UEM: 0.6216, LEM: 0.3814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4446, partial_loss/deprel_loss: 0.4394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6127, loss: 0.6547, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  37%|###6      | 41/111 [00:29<00:50,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9518, LAS: 0.9095, UEM: 0.6119, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4576, partial_loss/deprel_loss: 0.4736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6427, loss: 0.6515, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  41%|####      | 45/111 [00:31<00:45,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9508, LAS: 0.9086, UEM: 0.6184, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1493, partial_loss/deprel_loss: 0.2488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4012, loss: 0.6600, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  43%|####3     | 48/111 [00:34<00:45,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9505, LAS: 0.9082, UEM: 0.6075, LEM: 0.3719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6031, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6935, loss: 0.6638, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  46%|####5     | 51/111 [00:36<00:44,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9509, LAS: 0.9087, UEM: 0.6097, LEM: 0.3735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1804, partial_loss/deprel_loss: 0.3201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4644, loss: 0.6610, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  49%|####8     | 54/111 [00:38<00:42,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9501, LAS: 0.9077, UEM: 0.6038, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0205, partial_loss/deprel_loss: 0.7639, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9874, loss: 0.6706, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  51%|#####1    | 57/111 [00:41<00:39,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9498, LAS: 0.9072, UEM: 0.5953, LEM: 0.3598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6021, partial_loss/deprel_loss: 0.5233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7113, loss: 0.6743, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  55%|#####4    | 61/111 [00:43<00:35,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9496, LAS: 0.9071, UEM: 0.5866, LEM: 0.3521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3604, partial_loss/deprel_loss: 0.4199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5802, loss: 0.6753, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  59%|#####8    | 65/111 [00:46<00:31,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9505, LAS: 0.9079, UEM: 0.5911, LEM: 0.3532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2425, partial_loss/deprel_loss: 0.4279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5631, loss: 0.6692, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  62%|######2   | 69/111 [00:49<00:29,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9508, LAS: 0.9080, UEM: 0.5965, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1185, partial_loss/deprel_loss: 0.3069, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4414, loss: 0.6676, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  66%|######5   | 73/111 [00:51<00:26,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9508, LAS: 0.9081, UEM: 0.6005, LEM: 0.3605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2179, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.6657, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  68%|######8   | 76/111 [00:54<00:26,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9501, LAS: 0.9073, UEM: 0.5916, LEM: 0.3543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7469, partial_loss/deprel_loss: 0.6689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8567, loss: 0.6726, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  71%|#######1  | 79/111 [00:56<00:23,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8454, UAS: 0.9500, LAS: 0.9070, UEM: 0.5944, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3228, partial_loss/deprel_loss: 0.8789, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1398, loss: 0.6744, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  75%|#######4  | 83/111 [00:59<00:20,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9497, LAS: 0.9067, UEM: 0.5907, LEM: 0.3531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1929, partial_loss/deprel_loss: 0.2878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4410, loss: 0.6763, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  78%|#######8  | 87/111 [01:01<00:16,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9492, LAS: 0.9060, UEM: 0.5841, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6835, partial_loss/deprel_loss: 0.5940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7840, loss: 0.6808, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  81%|########1 | 90/111 [01:03<00:14,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9490, LAS: 0.9058, UEM: 0.5808, LEM: 0.3447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7765, partial_loss/deprel_loss: 0.6530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8498, loss: 0.6830, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  84%|########3 | 93/111 [01:05<00:12,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9491, LAS: 0.9058, UEM: 0.5772, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6823, partial_loss/deprel_loss: 0.6745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8483, loss: 0.6848, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  87%|########7 | 97/111 [01:08<00:09,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9499, LAS: 0.9066, UEM: 0.5916, LEM: 0.3558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2769, partial_loss/deprel_loss: 0.4403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.6777, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  91%|######### | 101/111 [01:11<00:06,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9636, UAS: 0.9495, LAS: 0.9062, UEM: 0.6024, LEM: 0.3746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0667, partial_loss/deprel_loss: 0.1438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3005, loss: 0.6809, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||:  94%|#########3| 104/111 [01:13<00:05,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9497, LAS: 0.9063, UEM: 0.6006, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4018, partial_loss/deprel_loss: 0.4389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6036, loss: 0.6805, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||:  96%|#########6| 107/111 [01:16<00:02,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9496, LAS: 0.9061, UEM: 0.5974, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3216, partial_loss/deprel_loss: 0.4782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6190, loss: 0.6823, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||:  99%|#########9| 110/111 [01:18<00:00,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9495, LAS: 0.9060, UEM: 0.5958, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5263, partial_loss/deprel_loss: 0.5980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7558, loss: 0.6830, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||: 100%|##########| 111/111 [01:18<00:00,  1.41it/s]\n",
+      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.598  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.526  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - UEM                      |     0.596  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - LAS                      |     0.906  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - loss                     |     0.683  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - LEM                      |     0.366  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - EM                       |     0.895  |       N/A\n",
+      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:40:37,041 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:40:41,884 - INFO - combo.training.trainer - Epoch duration: 0:01:27.026083\n",
+      "2023-04-07 00:40:41,884 - INFO - combo.training.trainer - Estimated training time remaining: 7:10:06\n",
+      "2023-04-07 00:40:41,885 - INFO - allennlp.training.trainer - Epoch 82/399\n",
+      "2023-04-07 00:40:41,885 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:40:41,885 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:40:41,894 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9409, LAS: 0.8998, UEM: 0.4771, LEM: 0.2604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0136, partial_loss/deprel_loss: 0.6579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9012, loss: 0.7123, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:   4%|3         | 4/111 [00:02<01:10,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9483, LAS: 0.9083, UEM: 0.6919, LEM: 0.5363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5977, partial_loss/deprel_loss: 0.5405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7241, loss: 0.6607, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:   6%|6         | 7/111 [00:05<01:14,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9542, LAS: 0.9138, UEM: 0.7011, LEM: 0.4979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6391, partial_loss/deprel_loss: 0.5094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7074, loss: 0.6194, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  10%|9         | 11/111 [00:07<01:08,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9534, LAS: 0.9131, UEM: 0.6858, LEM: 0.4754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4420, partial_loss/deprel_loss: 0.4731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.6224, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  13%|#2        | 14/111 [00:09<01:05,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9539, LAS: 0.9126, UEM: 0.6711, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6797, partial_loss/deprel_loss: 0.6238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8071, loss: 0.6269, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  16%|#6        | 18/111 [00:12<01:01,  1.52it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9545, LAS: 0.9128, UEM: 0.6608, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3726, partial_loss/deprel_loss: 0.5161, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6595, loss: 0.6252, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  19%|#8        | 21/111 [00:14<01:00,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9565, LAS: 0.9145, UEM: 0.6808, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4160, partial_loss/deprel_loss: 0.5045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6589, loss: 0.6114, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  22%|##1       | 24/111 [00:16<01:01,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9542, LAS: 0.9119, UEM: 0.6572, LEM: 0.4251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6785, partial_loss/deprel_loss: 0.6107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7963, loss: 0.6330, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  24%|##4       | 27/111 [00:18<00:58,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9553, LAS: 0.9132, UEM: 0.6573, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2071, partial_loss/deprel_loss: 0.3437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.6242, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  28%|##7       | 31/111 [00:21<00:56,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9533, LAS: 0.9109, UEM: 0.6456, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1913, partial_loss/deprel_loss: 0.8398, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0822, loss: 0.6427, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  31%|###       | 34/111 [00:23<00:53,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9520, LAS: 0.9095, UEM: 0.6338, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0930, partial_loss/deprel_loss: 0.6926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9448, loss: 0.6531, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  33%|###3      | 37/111 [00:25<00:52,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9523, LAS: 0.9097, UEM: 0.6358, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1727, partial_loss/deprel_loss: 0.3159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4593, loss: 0.6540, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  37%|###6      | 41/111 [00:28<00:48,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9517, LAS: 0.9092, UEM: 0.6257, LEM: 0.3878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2168, partial_loss/deprel_loss: 0.3799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5193, loss: 0.6588, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  41%|####      | 45/111 [00:30<00:42,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9508, LAS: 0.9081, UEM: 0.6245, LEM: 0.3829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4910, partial_loss/deprel_loss: 0.5458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7069, loss: 0.6681, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  44%|####4     | 49/111 [00:33<00:40,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9501, LAS: 0.9071, UEM: 0.6120, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8077, partial_loss/deprel_loss: 0.6382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8442, loss: 0.6766, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  48%|####7     | 53/111 [00:35<00:39,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9507, LAS: 0.9076, UEM: 0.6135, LEM: 0.3716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2720, partial_loss/deprel_loss: 0.4549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5904, loss: 0.6743, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  50%|#####     | 56/111 [00:38<00:38,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9502, LAS: 0.9071, UEM: 0.5999, LEM: 0.3610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6217, partial_loss/deprel_loss: 0.5910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7692, loss: 0.6763, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  54%|#####4    | 60/111 [00:40<00:34,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9502, LAS: 0.9069, UEM: 0.5913, LEM: 0.3521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5812, partial_loss/deprel_loss: 0.5780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7507, loss: 0.6767, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9498, LAS: 0.9065, UEM: 0.5906, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2432, partial_loss/deprel_loss: 0.3638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5117, loss: 0.6800, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  60%|######    | 67/111 [00:46<00:32,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9500, LAS: 0.9065, UEM: 0.5908, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2326, partial_loss/deprel_loss: 0.4214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5557, loss: 0.6793, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  63%|######3   | 70/111 [00:48<00:30,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.9501, LAS: 0.9067, UEM: 0.5942, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9001, partial_loss/deprel_loss: 0.6856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9006, loss: 0.6772, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  66%|######5   | 73/111 [00:50<00:28,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9371, UAS: 0.9502, LAS: 0.9067, UEM: 0.5941, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1827, partial_loss/deprel_loss: 0.3380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4790, loss: 0.6774, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  68%|######8   | 76/111 [00:52<00:26,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9507, LAS: 0.9072, UEM: 0.6020, LEM: 0.3641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3602, partial_loss/deprel_loss: 0.5102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6522, loss: 0.6746, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  72%|#######2  | 80/111 [00:55<00:22,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9504, LAS: 0.9068, UEM: 0.5954, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7883, partial_loss/deprel_loss: 0.6437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8446, loss: 0.6771, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  75%|#######4  | 83/111 [00:57<00:19,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9504, LAS: 0.9068, UEM: 0.5946, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3513, partial_loss/deprel_loss: 0.4657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6149, loss: 0.6778, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  77%|#######7  | 86/111 [00:59<00:17,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9503, LAS: 0.9066, UEM: 0.5921, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3417, partial_loss/deprel_loss: 0.4772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.6793, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  80%|########  | 89/111 [01:01<00:15,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9502, LAS: 0.9063, UEM: 0.5880, LEM: 0.3507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7008, partial_loss/deprel_loss: 0.5836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7791, loss: 0.6807, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  83%|########2 | 92/111 [01:03<00:13,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9504, LAS: 0.9067, UEM: 0.5963, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6970, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7733, loss: 0.6775, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  86%|########5 | 95/111 [01:06<00:11,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9136, UAS: 0.9498, LAS: 0.9059, UEM: 0.5917, LEM: 0.3550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3445, partial_loss/deprel_loss: 0.4310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5857, loss: 0.6827, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  89%|########9 | 99/111 [01:08<00:08,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9501, LAS: 0.9062, UEM: 0.5957, LEM: 0.3577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2567, partial_loss/deprel_loss: 0.4081, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5498, loss: 0.6808, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  92%|#########1| 102/111 [01:10<00:06,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9501, LAS: 0.9062, UEM: 0.5980, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1534, partial_loss/deprel_loss: 0.2828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4289, loss: 0.6796, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:  95%|#########5| 106/111 [01:13<00:03,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9505, LAS: 0.9066, UEM: 0.6012, LEM: 0.3650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2708, partial_loss/deprel_loss: 0.3733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5247, loss: 0.6757, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:  98%|#########8| 109/111 [01:15<00:01,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9500, LAS: 0.9062, UEM: 0.5992, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3536, partial_loss/deprel_loss: 0.4593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6101, loss: 0.6789, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||: 100%|##########| 111/111 [01:17<00:00,  1.44it/s]\n",
+      "2023-04-07 00:42:02,217 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.459  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.354  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - UEM                      |     0.599  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - LAS                      |     0.906  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - loss                     |     0.679  |       N/A\n",
+      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - LEM                      |     0.363  |       N/A\n",
+      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
+      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - EM                       |     0.915  |       N/A\n",
+      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:42:02,224 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:42:07,283 - INFO - combo.training.trainer - Epoch duration: 0:01:25.398504\n",
+      "2023-04-07 00:42:07,284 - INFO - combo.training.trainer - Estimated training time remaining: 7:09:01\n",
+      "2023-04-07 00:42:07,284 - INFO - allennlp.training.trainer - Epoch 83/399\n",
+      "2023-04-07 00:42:07,284 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:42:07,285 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:42:07,294 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9284, LAS: 0.8837, UEM: 0.1775, LEM: 0.0476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6096, partial_loss/deprel_loss: 0.6407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8064, loss: 0.8763, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:   3%|2         | 3/111 [00:02<01:18,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9434, LAS: 0.8991, UEM: 0.5232, LEM: 0.2785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2584, partial_loss/deprel_loss: 0.4491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5829, loss: 0.7464, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:   5%|5         | 6/111 [00:04<01:14,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9472, LAS: 0.9040, UEM: 0.5188, LEM: 0.2745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3754, partial_loss/deprel_loss: 0.4332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5936, loss: 0.7046, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:   9%|9         | 10/111 [00:06<01:09,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9509, LAS: 0.9083, UEM: 0.5943, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7866, partial_loss/deprel_loss: 0.5632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7799, loss: 0.6678, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:  13%|#2        | 14/111 [00:09<01:03,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9491, LAS: 0.9066, UEM: 0.5690, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4959, partial_loss/deprel_loss: 0.5747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7309, loss: 0.6766, batch_reg_loss: 0.1719, reg_loss: 0.1720 ||:  15%|#5        | 17/111 [00:11<01:04,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9483, LAS: 0.9054, UEM: 0.5519, LEM: 0.3169, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7224, partial_loss/deprel_loss: 0.6577, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8426, loss: 0.6896, batch_reg_loss: 0.1719, reg_loss: 0.1720 ||:  19%|#8        | 21/111 [00:13<00:58,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9476, LAS: 0.9052, UEM: 0.5393, LEM: 0.3055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3746, partial_loss/deprel_loss: 0.7047, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0106, loss: 0.6951, batch_reg_loss: 0.1719, reg_loss: 0.1720 ||:  23%|##3       | 26/111 [00:15<00:50,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9492, LAS: 0.9067, UEM: 0.6104, LEM: 0.3823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2221, partial_loss/deprel_loss: 0.3582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5029, loss: 0.6811, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  27%|##7       | 30/111 [00:18<00:47,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9487, LAS: 0.9066, UEM: 0.5992, LEM: 0.3710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9904, partial_loss/deprel_loss: 0.5820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8356, loss: 0.6787, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  31%|###       | 34/111 [00:20<00:46,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9484, LAS: 0.9060, UEM: 0.5845, LEM: 0.3575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7106, partial_loss/deprel_loss: 0.6451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8301, loss: 0.6820, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  34%|###4      | 38/111 [00:23<00:43,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9472, LAS: 0.9040, UEM: 0.5775, LEM: 0.3495, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2128, partial_loss/deprel_loss: 0.3823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.6965, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  38%|###7      | 42/111 [00:25<00:42,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9459, LAS: 0.9025, UEM: 0.5688, LEM: 0.3394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5569, partial_loss/deprel_loss: 0.5899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7552, loss: 0.7069, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  41%|####1     | 46/111 [00:28<00:42,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9474, LAS: 0.9046, UEM: 0.6034, LEM: 0.3864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2728, partial_loss/deprel_loss: 0.3495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5061, loss: 0.6915, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  45%|####5     | 50/111 [00:31<00:42,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9489, LAS: 0.9062, UEM: 0.6256, LEM: 0.4053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1323, partial_loss/deprel_loss: 0.2757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4189, loss: 0.6783, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  48%|####7     | 53/111 [00:34<00:42,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9494, LAS: 0.9068, UEM: 0.6231, LEM: 0.4025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3449, partial_loss/deprel_loss: 0.4298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.6730, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  51%|#####1    | 57/111 [00:36<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9496, LAS: 0.9068, UEM: 0.6177, LEM: 0.3945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4062, partial_loss/deprel_loss: 0.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5946, loss: 0.6716, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  55%|#####4    | 61/111 [00:39<00:34,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9496, LAS: 0.9068, UEM: 0.6141, LEM: 0.3893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3288, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5248, loss: 0.6721, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  58%|#####7    | 64/111 [00:41<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9504, LAS: 0.9075, UEM: 0.6194, LEM: 0.3902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2091, partial_loss/deprel_loss: 0.3767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5151, loss: 0.6667, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  60%|######    | 67/111 [00:44<00:33,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9505, LAS: 0.9076, UEM: 0.6181, LEM: 0.3875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4662, partial_loss/deprel_loss: 0.4629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6354, loss: 0.6657, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  63%|######3   | 70/111 [00:46<00:30,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8761, UAS: 0.9504, LAS: 0.9074, UEM: 0.6133, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7722, partial_loss/deprel_loss: 0.6533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8489, loss: 0.6670, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  66%|######5   | 73/111 [00:48<00:28,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9505, LAS: 0.9074, UEM: 0.6114, LEM: 0.3800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9190, partial_loss/deprel_loss: 0.6907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9083, loss: 0.6686, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  68%|######8   | 76/111 [00:50<00:25,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9506, LAS: 0.9075, UEM: 0.6083, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2458, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5082, loss: 0.6687, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  72%|#######2  | 80/111 [00:53<00:22,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9507, LAS: 0.9076, UEM: 0.6118, LEM: 0.3788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1026, partial_loss/deprel_loss: 0.2484, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3911, loss: 0.6690, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  76%|#######5  | 84/111 [00:56<00:18,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8797, UAS: 0.9502, LAS: 0.9070, UEM: 0.6113, LEM: 0.3799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7965, partial_loss/deprel_loss: 0.6126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8212, loss: 0.6721, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  78%|#######8  | 87/111 [00:58<00:16,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9498, LAS: 0.9066, UEM: 0.6044, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6229, partial_loss/deprel_loss: 0.5504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7368, loss: 0.6750, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  81%|########1 | 90/111 [01:00<00:14,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9495, LAS: 0.9063, UEM: 0.6002, LEM: 0.3700, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6756, partial_loss/deprel_loss: 0.6268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8084, loss: 0.6786, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  84%|########3 | 93/111 [01:02<00:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9491, LAS: 0.9058, UEM: 0.5947, LEM: 0.3652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3796, partial_loss/deprel_loss: 0.4655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6201, loss: 0.6819, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  86%|########6 | 96/111 [01:04<00:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9492, LAS: 0.9059, UEM: 0.5928, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2853, partial_loss/deprel_loss: 0.4503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5891, loss: 0.6819, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  90%|######### | 100/111 [01:06<00:07,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9496, LAS: 0.9062, UEM: 0.5967, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1409, partial_loss/deprel_loss: 0.3100, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4481, loss: 0.6789, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  94%|#########3| 104/111 [01:09<00:04,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9499, LAS: 0.9066, UEM: 0.6023, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1972, partial_loss/deprel_loss: 0.3334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.6747, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  97%|#########7| 108/111 [01:12<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9498, LAS: 0.9063, UEM: 0.5988, LEM: 0.3643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4659, partial_loss/deprel_loss: 0.5357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6935, loss: 0.6770, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
+      "2023-04-07 00:43:24,069 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.536  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.466  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - UEM                      |     0.599  |       N/A\n",
+      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - LAS                      |     0.906  |       N/A\n",
+      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - loss                     |     0.677  |       N/A\n",
+      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - LEM                      |     0.364  |       N/A\n",
+      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
+      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - EM                       |     0.896  |       N/A\n",
+      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:43:24,076 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:43:28,783 - INFO - combo.training.trainer - Epoch duration: 0:01:21.499439\n",
+      "2023-04-07 00:43:28,783 - INFO - combo.training.trainer - Estimated training time remaining: 7:07:41\n",
+      "2023-04-07 00:43:28,784 - INFO - allennlp.training.trainer - Epoch 84/399\n",
+      "2023-04-07 00:43:28,784 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:43:28,784 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:43:28,790 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9514, LAS: 0.9079, UEM: 0.4796, LEM: 0.2044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.4113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5584, loss: 0.6576, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:   5%|4         | 5/111 [00:02<00:45,  2.32it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9469, LAS: 0.9044, UEM: 0.4177, LEM: 0.1680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4348, partial_loss/deprel_loss: 0.4723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6366, loss: 0.6858, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:   9%|9         | 10/111 [00:04<00:44,  2.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8954, UAS: 0.9428, LAS: 0.9011, UEM: 0.4024, LEM: 0.1678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6157, partial_loss/deprel_loss: 0.6063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.7110, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  14%|#3        | 15/111 [00:06<00:43,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8660, UAS: 0.9426, LAS: 0.9007, UEM: 0.4122, LEM: 0.1725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1330, partial_loss/deprel_loss: 0.7580, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0048, loss: 0.7214, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  16%|#6        | 18/111 [00:08<00:49,  1.89it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9024, UAS: 0.9414, LAS: 0.8983, UEM: 0.3904, LEM: 0.1592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5205, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6976, loss: 0.7382, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  19%|#8        | 21/111 [00:11<00:53,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9424, LAS: 0.8993, UEM: 0.4119, LEM: 0.1776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3382, partial_loss/deprel_loss: 0.4379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5897, loss: 0.7295, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  22%|##1       | 24/111 [00:13<00:54,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9434, LAS: 0.9004, UEM: 0.4380, LEM: 0.2060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4872, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7103, loss: 0.7223, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  24%|##4       | 27/111 [00:15<00:55,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9455, LAS: 0.9026, UEM: 0.4731, LEM: 0.2309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2584, partial_loss/deprel_loss: 0.3982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5420, loss: 0.7058, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  27%|##7       | 30/111 [00:17<00:53,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9473, LAS: 0.9042, UEM: 0.5138, LEM: 0.2729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1126, partial_loss/deprel_loss: 0.2701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4104, loss: 0.6924, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  31%|###       | 34/111 [00:20<00:52,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9434, LAS: 0.9001, UEM: 0.4985, LEM: 0.2645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8823, partial_loss/deprel_loss: 0.6641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8795, loss: 0.7238, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  33%|###3      | 37/111 [00:22<00:51,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9439, LAS: 0.9003, UEM: 0.4910, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5793, partial_loss/deprel_loss: 0.5165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7008, loss: 0.7221, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  36%|###6      | 40/111 [00:24<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9448, LAS: 0.9013, UEM: 0.4970, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2447, partial_loss/deprel_loss: 0.4143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5522, loss: 0.7138, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  39%|###8      | 43/111 [00:26<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9465, LAS: 0.9034, UEM: 0.5256, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2238, partial_loss/deprel_loss: 0.3439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4916, loss: 0.6992, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  41%|####1     | 46/111 [00:28<00:45,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9223, UAS: 0.9458, LAS: 0.9026, UEM: 0.5203, LEM: 0.2823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2626, partial_loss/deprel_loss: 0.3949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5402, loss: 0.7034, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  44%|####4     | 49/111 [00:31<00:43,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9466, LAS: 0.9034, UEM: 0.5216, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3617, partial_loss/deprel_loss: 0.4681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6186, loss: 0.6996, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  47%|####6     | 52/111 [00:33<00:41,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9474, LAS: 0.9043, UEM: 0.5501, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1540, partial_loss/deprel_loss: 0.3062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4475, loss: 0.6910, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  50%|#####     | 56/111 [00:35<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9467, LAS: 0.9035, UEM: 0.5399, LEM: 0.3035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1279, partial_loss/deprel_loss: 0.7786, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0202, loss: 0.6955, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  54%|#####4    | 60/111 [00:38<00:33,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9474, LAS: 0.9045, UEM: 0.5443, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1799, partial_loss/deprel_loss: 0.3411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4806, loss: 0.6883, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  58%|#####7    | 64/111 [00:40<00:30,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8833, UAS: 0.9474, LAS: 0.9044, UEM: 0.5436, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7734, partial_loss/deprel_loss: 0.7165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8995, loss: 0.6890, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  61%|######1   | 68/111 [00:43<00:27,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9484, LAS: 0.9054, UEM: 0.5534, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.4111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5501, loss: 0.6814, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  65%|######4   | 72/111 [00:46<00:26,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9485, LAS: 0.9056, UEM: 0.5534, LEM: 0.3148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6119, partial_loss/deprel_loss: 0.5648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7459, loss: 0.6804, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  68%|######7   | 75/111 [00:48<00:25,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9488, LAS: 0.9060, UEM: 0.5591, LEM: 0.3222, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2361, partial_loss/deprel_loss: 0.2912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4519, loss: 0.6775, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  70%|#######   | 78/111 [00:51<00:25,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9494, LAS: 0.9067, UEM: 0.5780, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0818, partial_loss/deprel_loss: 0.2043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3515, loss: 0.6721, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  73%|#######2  | 81/111 [00:53<00:22,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8720, UAS: 0.9490, LAS: 0.9061, UEM: 0.5733, LEM: 0.3404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9083, partial_loss/deprel_loss: 0.6554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8776, loss: 0.6770, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  77%|#######6  | 85/111 [00:56<00:18,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9488, LAS: 0.9059, UEM: 0.5730, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1963, partial_loss/deprel_loss: 0.3102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4591, loss: 0.6784, batch_reg_loss: 0.1717, reg_loss: 0.1717 ||:  80%|########  | 89/111 [00:58<00:15,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9676, UAS: 0.9493, LAS: 0.9065, UEM: 0.5893, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0396, partial_loss/deprel_loss: 0.1135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2704, loss: 0.6757, batch_reg_loss: 0.1717, reg_loss: 0.1717 ||:  83%|########2 | 92/111 [01:01<00:14,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9494, LAS: 0.9066, UEM: 0.5906, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8848, partial_loss/deprel_loss: 0.7517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9500, loss: 0.6758, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||:  86%|########5 | 95/111 [01:03<00:11,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9497, LAS: 0.9070, UEM: 0.5945, LEM: 0.3684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6637, partial_loss/deprel_loss: 0.6962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8613, loss: 0.6744, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||:  88%|########8 | 98/111 [01:05<00:09,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8481, UAS: 0.9495, LAS: 0.9067, UEM: 0.5956, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2025, partial_loss/deprel_loss: 0.8264, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0732, loss: 0.6749, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||:  92%|#########1| 102/111 [01:08<00:06,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9498, LAS: 0.9069, UEM: 0.5952, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2573, partial_loss/deprel_loss: 0.4458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.6735, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||:  95%|#########4| 105/111 [01:10<00:04,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9498, LAS: 0.9069, UEM: 0.5966, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2900, partial_loss/deprel_loss: 0.4007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5502, loss: 0.6728, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||:  98%|#########8| 109/111 [01:13<00:01,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9500, LAS: 0.9070, UEM: 0.6010, LEM: 0.3704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0986, partial_loss/deprel_loss: 0.3075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4373, loss: 0.6715, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
+      "2023-04-07 00:44:46,230 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:44:46,230 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:44:46,230 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:44:46,230 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.307  |       N/A\n",
+      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.099  |       N/A\n",
+      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |       N/A\n",
+      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - UEM                      |     0.601  |       N/A\n",
+      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - LAS                      |     0.907  |       N/A\n",
+      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - loss                     |     0.671  |       N/A\n",
+      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - LEM                      |     0.370  |       N/A\n",
+      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
+      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:44:46,233 - INFO - combo.training.tensorboard_writer - EM                       |     0.935  |       N/A\n",
+      "2023-04-07 00:44:46,233 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:44:46,238 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:44:52,274 - INFO - combo.training.trainer - Epoch duration: 0:01:23.490118\n",
+      "2023-04-07 00:44:52,274 - INFO - combo.training.trainer - Estimated training time remaining: 7:06:28\n",
+      "2023-04-07 00:44:52,274 - INFO - allennlp.training.trainer - Epoch 85/399\n",
+      "2023-04-07 00:44:52,274 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:44:52,275 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:44:52,284 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9489, LAS: 0.9040, UEM: 0.4945, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4882, partial_loss/deprel_loss: 0.5869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7388, loss: 0.6966, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:   4%|3         | 4/111 [00:02<00:59,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9493, LAS: 0.9031, UEM: 0.4720, LEM: 0.2297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8211, partial_loss/deprel_loss: 0.6876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8859, loss: 0.7048, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:   7%|7         | 8/111 [00:04<00:59,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8923, UAS: 0.9508, LAS: 0.9050, UEM: 0.5020, LEM: 0.2539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5759, partial_loss/deprel_loss: 0.5518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7282, loss: 0.6806, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  10%|9         | 11/111 [00:07<01:03,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9533, LAS: 0.9086, UEM: 0.5372, LEM: 0.2891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2173, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5025, loss: 0.6507, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  14%|#3        | 15/111 [00:09<01:01,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9512, LAS: 0.9070, UEM: 0.5409, LEM: 0.2963, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.6631, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  16%|#6        | 18/111 [00:12<01:05,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9511, LAS: 0.9074, UEM: 0.5449, LEM: 0.3035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2308, partial_loss/deprel_loss: 0.3370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4873, loss: 0.6610, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  19%|#8        | 21/111 [00:14<01:03,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9543, LAS: 0.9116, UEM: 0.6365, LEM: 0.4128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2214, partial_loss/deprel_loss: 0.4003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5361, loss: 0.6342, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  22%|##1       | 24/111 [00:16<01:03,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9527, LAS: 0.9099, UEM: 0.6114, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3740, partial_loss/deprel_loss: 0.4229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.6472, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  25%|##5       | 28/111 [00:19<00:58,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9535, LAS: 0.9106, UEM: 0.6154, LEM: 0.3871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1930, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4861, loss: 0.6429, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  28%|##7       | 31/111 [00:21<00:55,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9547, LAS: 0.9122, UEM: 0.6263, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3075, partial_loss/deprel_loss: 0.4177, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5672, loss: 0.6327, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  31%|###       | 34/111 [00:23<00:53,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9544, LAS: 0.9119, UEM: 0.6212, LEM: 0.3862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6734, partial_loss/deprel_loss: 0.6002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7864, loss: 0.6345, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  34%|###4      | 38/111 [00:25<00:48,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9535, LAS: 0.9111, UEM: 0.6093, LEM: 0.3757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6099, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7056, loss: 0.6401, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  37%|###6      | 41/111 [00:27<00:47,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9540, LAS: 0.9116, UEM: 0.6067, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3456, partial_loss/deprel_loss: 0.5257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6612, loss: 0.6379, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  41%|####      | 45/111 [00:30<00:43,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9532, LAS: 0.9111, UEM: 0.5997, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7733, partial_loss/deprel_loss: 0.6122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8159, loss: 0.6409, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  44%|####4     | 49/111 [00:32<00:40,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9513, LAS: 0.9092, UEM: 0.5832, LEM: 0.3510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6072, partial_loss/deprel_loss: 0.5884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7637, loss: 0.6533, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  48%|####7     | 53/111 [00:35<00:39,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9512, LAS: 0.9091, UEM: 0.5850, LEM: 0.3532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6603, partial_loss/deprel_loss: 0.6363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8126, loss: 0.6534, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  50%|#####     | 56/111 [00:38<00:38,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9517, LAS: 0.9096, UEM: 0.5943, LEM: 0.3615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1501, partial_loss/deprel_loss: 0.2723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.6495, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  54%|#####4    | 60/111 [00:40<00:34,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9500, LAS: 0.9079, UEM: 0.5866, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4817, partial_loss/deprel_loss: 0.5117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6772, loss: 0.6611, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9503, LAS: 0.9082, UEM: 0.5875, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6555, partial_loss/deprel_loss: 0.6512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8236, loss: 0.6617, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  61%|######1   | 68/111 [00:46<00:30,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9508, LAS: 0.9088, UEM: 0.5997, LEM: 0.3701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5530, partial_loss/deprel_loss: 0.4983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6807, loss: 0.6568, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  64%|######3   | 71/111 [00:48<00:28,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9502, LAS: 0.9081, UEM: 0.5917, LEM: 0.3636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7786, partial_loss/deprel_loss: 0.6569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8527, loss: 0.6633, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  67%|######6   | 74/111 [00:50<00:26,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9503, LAS: 0.9081, UEM: 0.5887, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5200, partial_loss/deprel_loss: 0.5049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6793, loss: 0.6635, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  69%|######9   | 77/111 [00:52<00:23,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9494, LAS: 0.9071, UEM: 0.5841, LEM: 0.3539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3174, partial_loss/deprel_loss: 0.4077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5611, loss: 0.6703, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  72%|#######2  | 80/111 [00:54<00:21,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9502, LAS: 0.9081, UEM: 0.6033, LEM: 0.3762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2790, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5367, loss: 0.6625, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  75%|#######4  | 83/111 [00:57<00:20,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9505, LAS: 0.9084, UEM: 0.6038, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2464, partial_loss/deprel_loss: 0.3908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5334, loss: 0.6609, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  77%|#######7  | 86/111 [00:59<00:18,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9498, LAS: 0.9076, UEM: 0.5981, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9836, partial_loss/deprel_loss: 0.6747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9079, loss: 0.6671, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  81%|########1 | 90/111 [01:01<00:14,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9492, LAS: 0.9069, UEM: 0.5945, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7101, partial_loss/deprel_loss: 0.6880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8639, loss: 0.6734, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  85%|########4 | 94/111 [01:04<00:11,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8769, UAS: 0.9493, LAS: 0.9069, UEM: 0.5976, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9722, partial_loss/deprel_loss: 0.6962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9228, loss: 0.6741, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  87%|########7 | 97/111 [01:06<00:09,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9496, LAS: 0.9071, UEM: 0.5950, LEM: 0.3648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7420, partial_loss/deprel_loss: 0.7137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8908, loss: 0.6729, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  92%|#########1| 102/111 [01:08<00:05,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9499, LAS: 0.9075, UEM: 0.5979, LEM: 0.3685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5373, partial_loss/deprel_loss: 0.5125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6889, loss: 0.6693, batch_reg_loss: 0.1714, reg_loss: 0.1715 ||:  96%|#########6| 107/111 [01:11<00:02,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9504, LAS: 0.9079, UEM: 0.6026, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2185, partial_loss/deprel_loss: 0.3660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5080, loss: 0.6663, batch_reg_loss: 0.1714, reg_loss: 0.1715 ||: 100%|##########| 111/111 [01:13<00:00,  1.52it/s]\n",
+      "2023-04-07 00:46:08,660 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9122, LAS: 0.8613, UEM: 0.3719, LEM: 0.1357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6872, partial_loss/deprel_loss: 33.7202, partial_loss/cycle_loss: 0.0000, batch_loss: 27.1136, loss: 36.1110, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.03s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.9236, LAS: 0.8697, UEM: 0.3147, LEM: 0.0932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3113, partial_loss/deprel_loss: 47.1769, partial_loss/cycle_loss: 0.0000, batch_loss: 38.0038, loss: 32.5457, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:08,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9373, LAS: 0.8872, UEM: 0.6018, LEM: 0.3907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1716, partial_loss/deprel_loss: 19.2356, partial_loss/cycle_loss: 0.0000, batch_loss: 15.4228, loss: 28.2524, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:05,  1.00s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9431, LAS: 0.8932, UEM: 0.6361, LEM: 0.3959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1653, partial_loss/deprel_loss: 23.1310, partial_loss/cycle_loss: 0.0000, batch_loss: 18.5378, loss: 26.2134, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9160, UAS: 0.9460, LAS: 0.8958, UEM: 0.6466, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3953, partial_loss/deprel_loss: 25.8727, partial_loss/cycle_loss: 0.0000, batch_loss: 20.7773, loss: 25.2483, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9160, UAS: 0.9460, LAS: 0.8958, UEM: 0.6466, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3953, partial_loss/deprel_loss: 25.8727, partial_loss/cycle_loss: 0.0000, batch_loss: 20.7773, loss: 25.2483, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.366  |    25.873\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.218  |     0.395\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |     0.000\n",
+      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - UEM                      |     0.603  |     0.647\n",
+      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - LAS                      |     0.908  |     0.896\n",
+      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - loss                     |     0.666  |    25.248\n",
+      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - LEM                      |     0.371  |     0.386\n",
+      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |     0.946\n",
+      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - EM                       |     0.927  |     0.916\n",
+      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:46:21,318 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:46:26,252 - INFO - combo.training.trainer - Epoch duration: 0:01:33.977591\n",
+      "2023-04-07 00:46:26,252 - INFO - combo.training.trainer - Estimated training time remaining: 7:05:54\n",
+      "2023-04-07 00:46:26,252 - INFO - allennlp.training.trainer - Epoch 86/399\n",
+      "2023-04-07 00:46:26,252 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:46:26,253 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:46:26,259 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9549, LAS: 0.9143, UEM: 0.5126, LEM: 0.2644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5999, partial_loss/deprel_loss: 0.5818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7569, loss: 0.6319, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:   4%|3         | 4/111 [00:02<01:11,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9574, LAS: 0.9172, UEM: 0.5572, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2609, partial_loss/deprel_loss: 0.3570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5092, loss: 0.6052, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:   6%|6         | 7/111 [00:04<01:09,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9556, LAS: 0.9147, UEM: 0.5295, LEM: 0.2703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3098, partial_loss/deprel_loss: 0.4638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.6292, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:   9%|9         | 10/111 [00:06<01:08,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9560, LAS: 0.9151, UEM: 0.5308, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4331, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5955, loss: 0.6216, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  12%|#1        | 13/111 [00:08<01:07,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9553, LAS: 0.9142, UEM: 0.5352, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3347, partial_loss/deprel_loss: 0.4334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 0.6263, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  15%|#5        | 17/111 [00:11<01:03,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9548, LAS: 0.9133, UEM: 0.5388, LEM: 0.2755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2227, partial_loss/deprel_loss: 0.3917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5293, loss: 0.6341, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  18%|#8        | 20/111 [00:13<01:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9508, LAS: 0.9089, UEM: 0.5216, LEM: 0.2667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4718, partial_loss/deprel_loss: 0.5207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6823, loss: 0.6611, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  22%|##1       | 24/111 [00:15<00:56,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9503, LAS: 0.9078, UEM: 0.5263, LEM: 0.2784, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1759, partial_loss/deprel_loss: 0.3242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4659, loss: 0.6687, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  24%|##4       | 27/111 [00:18<00:58,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9507, LAS: 0.9085, UEM: 0.5438, LEM: 0.3015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2016, partial_loss/deprel_loss: 0.2894, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4432, loss: 0.6630, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  28%|##7       | 31/111 [00:20<00:53,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9506, LAS: 0.9088, UEM: 0.5685, LEM: 0.3411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6470, partial_loss/deprel_loss: 0.5150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7128, loss: 0.6591, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  31%|###       | 34/111 [00:22<00:52,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9505, LAS: 0.9085, UEM: 0.5655, LEM: 0.3368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2677, partial_loss/deprel_loss: 0.4214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5621, loss: 0.6591, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  34%|###4      | 38/111 [00:25<00:49,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9513, LAS: 0.9093, UEM: 0.5822, LEM: 0.3554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1440, partial_loss/deprel_loss: 0.2598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4080, loss: 0.6536, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  37%|###6      | 41/111 [00:27<00:48,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9521, LAS: 0.9097, UEM: 0.5914, LEM: 0.3558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2431, partial_loss/deprel_loss: 0.4478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5782, loss: 0.6479, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  40%|###9      | 44/111 [00:30<00:48,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9506, LAS: 0.9082, UEM: 0.5772, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0487, partial_loss/deprel_loss: 0.7064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9462, loss: 0.6611, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  42%|####2     | 47/111 [00:32<00:45,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9518, LAS: 0.9095, UEM: 0.5924, LEM: 0.3571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2587, partial_loss/deprel_loss: 0.4356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5716, loss: 0.6508, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  46%|####5     | 51/111 [00:34<00:42,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9527, LAS: 0.9100, UEM: 0.5966, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2301, partial_loss/deprel_loss: 0.3930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5318, loss: 0.6473, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  50%|####9     | 55/111 [00:37<00:39,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9522, LAS: 0.9094, UEM: 0.6012, LEM: 0.3618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1176, partial_loss/deprel_loss: 0.3189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.6513, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  53%|#####3    | 59/111 [00:40<00:35,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9524, LAS: 0.9098, UEM: 0.5956, LEM: 0.3554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4422, partial_loss/deprel_loss: 0.4964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6569, loss: 0.6495, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  57%|#####6    | 63/111 [00:42<00:31,  1.52it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9516, LAS: 0.9088, UEM: 0.5877, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3114, partial_loss/deprel_loss: 0.4026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5557, loss: 0.6568, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  60%|######    | 67/111 [00:44<00:27,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9507, LAS: 0.9080, UEM: 0.5830, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8306, partial_loss/deprel_loss: 0.6379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8478, loss: 0.6621, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  65%|######4   | 72/111 [00:47<00:22,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9501, LAS: 0.9074, UEM: 0.5871, LEM: 0.3530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1629, partial_loss/deprel_loss: 0.8042, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0473, loss: 0.6673, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  69%|######9   | 77/111 [00:49<00:18,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9510, LAS: 0.9086, UEM: 0.6098, LEM: 0.3822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2064, partial_loss/deprel_loss: 0.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4838, loss: 0.6614, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  73%|#######2  | 81/111 [00:51<00:16,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9511, LAS: 0.9085, UEM: 0.6124, LEM: 0.3836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3728, partial_loss/deprel_loss: 0.4867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6352, loss: 0.6604, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  77%|#######6  | 85/111 [00:55<00:16,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9501, LAS: 0.9075, UEM: 0.6048, LEM: 0.3768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6928, partial_loss/deprel_loss: 0.6402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8220, loss: 0.6699, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  80%|########  | 89/111 [00:58<00:14,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9502, LAS: 0.9077, UEM: 0.6015, LEM: 0.3738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1512, partial_loss/deprel_loss: 0.3505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4820, loss: 0.6682, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  84%|########3 | 93/111 [01:00<00:12,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9506, LAS: 0.9082, UEM: 0.6050, LEM: 0.3765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2539, partial_loss/deprel_loss: 0.3479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5004, loss: 0.6638, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  87%|########7 | 97/111 [01:03<00:09,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9503, LAS: 0.9078, UEM: 0.5996, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8053, partial_loss/deprel_loss: 0.7396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9240, loss: 0.6678, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  90%|######### | 100/111 [01:05<00:07,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9505, LAS: 0.9079, UEM: 0.6015, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6447, partial_loss/deprel_loss: 0.5784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7629, loss: 0.6663, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:  94%|#########3| 104/111 [01:08<00:04,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9501, LAS: 0.9076, UEM: 0.5952, LEM: 0.3664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5785, partial_loss/deprel_loss: 0.6021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7687, loss: 0.6689, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:  97%|#########7| 108/111 [01:10<00:01,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9503, LAS: 0.9078, UEM: 0.6002, LEM: 0.3706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5065, partial_loss/deprel_loss: 0.5337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6995, loss: 0.6659, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "2023-04-07 00:47:43,046 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.534  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.506  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - UEM                      |     0.600  |       N/A\n",
+      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - LAS                      |     0.908  |       N/A\n",
+      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - loss                     |     0.666  |       N/A\n",
+      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - LEM                      |     0.371  |       N/A\n",
+      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
+      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - EM                       |     0.902  |       N/A\n",
+      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:47:43,053 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:47:49,210 - INFO - combo.training.trainer - Epoch duration: 0:01:22.957862\n",
+      "2023-04-07 00:47:49,211 - INFO - combo.training.trainer - Estimated training time remaining: 7:04:38\n",
+      "2023-04-07 00:47:49,211 - INFO - allennlp.training.trainer - Epoch 87/399\n",
+      "2023-04-07 00:47:49,211 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:47:49,212 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:47:49,221 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9687, LAS: 0.9283, UEM: 0.6917, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3433, partial_loss/deprel_loss: 0.4337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5869, loss: 0.5496, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9621, LAS: 0.9222, UEM: 0.7021, LEM: 0.4715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1045, partial_loss/deprel_loss: 0.2157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3647, loss: 0.5783, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:   5%|5         | 6/111 [00:04<01:18,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9557, LAS: 0.9144, UEM: 0.6255, LEM: 0.3980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2458, partial_loss/deprel_loss: 0.3617, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5098, loss: 0.6403, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:   9%|9         | 10/111 [00:07<01:11,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9478, LAS: 0.9059, UEM: 0.5568, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8828, partial_loss/deprel_loss: 0.6399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8597, loss: 0.6974, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:  13%|#2        | 14/111 [00:09<01:07,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9500, LAS: 0.9077, UEM: 0.5914, LEM: 0.3698, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1040, partial_loss/deprel_loss: 0.3227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4502, loss: 0.6824, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:  15%|#5        | 17/111 [00:11<01:06,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9514, LAS: 0.9091, UEM: 0.6130, LEM: 0.3889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1171, partial_loss/deprel_loss: 0.2585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4015, loss: 0.6680, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:  18%|#8        | 20/111 [00:14<01:04,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9511, LAS: 0.9090, UEM: 0.5950, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7511, partial_loss/deprel_loss: 0.5584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7682, loss: 0.6676, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||:  21%|##        | 23/111 [00:16<01:01,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9521, LAS: 0.9100, UEM: 0.5844, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4836, partial_loss/deprel_loss: 0.5146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6796, loss: 0.6586, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||:  24%|##4       | 27/111 [00:18<00:55,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9511, LAS: 0.9096, UEM: 0.5885, LEM: 0.3636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3558, partial_loss/deprel_loss: 0.4047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5662, loss: 0.6604, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||:  28%|##7       | 31/111 [00:21<00:52,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9496, LAS: 0.9082, UEM: 0.5715, LEM: 0.3486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8574, partial_loss/deprel_loss: 0.6428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8570, loss: 0.6712, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||:  32%|###1      | 35/111 [00:23<00:49,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9515, LAS: 0.9106, UEM: 0.5987, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2422, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4673, loss: 0.6518, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  35%|###5      | 39/111 [00:27<00:51,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9506, LAS: 0.9096, UEM: 0.5906, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2880, partial_loss/deprel_loss: 0.8245, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0884, loss: 0.6588, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  38%|###7      | 42/111 [00:29<00:49,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9517, LAS: 0.9103, UEM: 0.6028, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2292, partial_loss/deprel_loss: 0.4404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5693, loss: 0.6515, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  41%|####1     | 46/111 [00:31<00:42,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9519, LAS: 0.9103, UEM: 0.5993, LEM: 0.3624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7766, partial_loss/deprel_loss: 0.5683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7812, loss: 0.6519, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  46%|####5     | 51/111 [00:33<00:36,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9516, LAS: 0.9102, UEM: 0.6066, LEM: 0.3695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2039, partial_loss/deprel_loss: 0.2804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4363, loss: 0.6525, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  50%|####9     | 55/111 [00:36<00:35,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9505, LAS: 0.9089, UEM: 0.5934, LEM: 0.3586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0241, partial_loss/deprel_loss: 0.7608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9846, loss: 0.6616, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  53%|#####3    | 59/111 [00:38<00:31,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9507, LAS: 0.9092, UEM: 0.6009, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2038, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4659, loss: 0.6563, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  57%|#####6    | 63/111 [00:41<00:29,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9497, LAS: 0.9081, UEM: 0.5987, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2139, partial_loss/deprel_loss: 0.3651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5061, loss: 0.6632, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  60%|######    | 67/111 [00:43<00:27,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9490, LAS: 0.9072, UEM: 0.5947, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4450, partial_loss/deprel_loss: 0.8776, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1623, loss: 0.6706, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  65%|######4   | 72/111 [00:46<00:23,  1.69it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9487, LAS: 0.9068, UEM: 0.5909, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2596, partial_loss/deprel_loss: 0.3874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5330, loss: 0.6724, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  69%|######9   | 77/111 [00:48<00:18,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9488, LAS: 0.9069, UEM: 0.5854, LEM: 0.3485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3230, partial_loss/deprel_loss: 0.4347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5835, loss: 0.6719, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  73%|#######2  | 81/111 [00:51<00:17,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9492, LAS: 0.9074, UEM: 0.6009, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7277, partial_loss/deprel_loss: 0.6733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8553, loss: 0.6688, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  77%|#######6  | 85/111 [00:54<00:16,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9496, LAS: 0.9078, UEM: 0.6041, LEM: 0.3746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1636, partial_loss/deprel_loss: 0.2827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4300, loss: 0.6651, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  80%|########  | 89/111 [00:57<00:14,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9493, LAS: 0.9073, UEM: 0.5980, LEM: 0.3695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4866, partial_loss/deprel_loss: 0.4848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6563, loss: 0.6681, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||:  84%|########3 | 93/111 [01:00<00:12,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9491, LAS: 0.9071, UEM: 0.5911, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3899, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.6705, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||:  87%|########7 | 97/111 [01:03<00:10,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9496, LAS: 0.9077, UEM: 0.5966, LEM: 0.3655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3368, partial_loss/deprel_loss: 0.4039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5616, loss: 0.6659, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||:  91%|######### | 101/111 [01:05<00:06,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9502, LAS: 0.9085, UEM: 0.6076, LEM: 0.3781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3070, partial_loss/deprel_loss: 0.3840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5397, loss: 0.6596, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||:  95%|#########4| 105/111 [01:08<00:03,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9502, LAS: 0.9084, UEM: 0.6053, LEM: 0.3757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4180, partial_loss/deprel_loss: 0.4299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5986, loss: 0.6600, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||:  98%|#########8| 109/111 [01:11<00:01,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9501, LAS: 0.9082, UEM: 0.6015, LEM: 0.3723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7131, partial_loss/deprel_loss: 0.6420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8273, loss: 0.6628, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
+      "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.642  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.713  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - UEM                      |     0.601  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - LAS                      |     0.908  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - loss                     |     0.663  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - LEM                      |     0.372  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - EM                       |     0.893  |       N/A\n",
+      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:49:05,048 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:49:10,018 - INFO - combo.training.trainer - Epoch duration: 0:01:20.806982\n",
+      "2023-04-07 00:49:10,018 - INFO - combo.training.trainer - Estimated training time remaining: 7:03:15\n",
+      "2023-04-07 00:49:10,018 - INFO - allennlp.training.trainer - Epoch 88/399\n",
+      "2023-04-07 00:49:10,019 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:49:10,019 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:49:10,028 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9648, LAS: 0.9244, UEM: 0.6771, LEM: 0.4049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3842, partial_loss/deprel_loss: 0.4413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6010, loss: 0.5365, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:   4%|3         | 4/111 [00:02<01:08,  1.56it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9613, LAS: 0.9201, UEM: 0.6885, LEM: 0.4540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1407, partial_loss/deprel_loss: 0.2453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3955, loss: 0.5656, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:   6%|6         | 7/111 [00:04<01:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9565, LAS: 0.9148, UEM: 0.6298, LEM: 0.3948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8094, partial_loss/deprel_loss: 0.6079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8192, loss: 0.6131, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  10%|9         | 11/111 [00:07<01:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9537, LAS: 0.9116, UEM: 0.6465, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4722, partial_loss/deprel_loss: 0.4675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6396, loss: 0.6314, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  13%|#2        | 14/111 [00:09<01:04,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9516, LAS: 0.9094, UEM: 0.6364, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2188, partial_loss/deprel_loss: 0.3068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4603, loss: 0.6542, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  16%|#6        | 18/111 [00:12<01:01,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9494, LAS: 0.9073, UEM: 0.6218, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7785, partial_loss/deprel_loss: 0.5826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7928, loss: 0.6670, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  20%|#9        | 22/111 [00:14<00:58,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9493, LAS: 0.9074, UEM: 0.6181, LEM: 0.3962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6356, partial_loss/deprel_loss: 0.5565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7434, loss: 0.6665, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  23%|##2       | 25/111 [00:16<00:58,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9479, LAS: 0.9056, UEM: 0.5939, LEM: 0.3749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5422, partial_loss/deprel_loss: 0.5184, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6942, loss: 0.6767, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  25%|##5       | 28/111 [00:19<00:57,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9484, LAS: 0.9059, UEM: 0.6016, LEM: 0.3789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1821, partial_loss/deprel_loss: 0.3461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4843, loss: 0.6760, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  28%|##7       | 31/111 [00:21<01:00,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9486, LAS: 0.9059, UEM: 0.5937, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7760, partial_loss/deprel_loss: 0.5979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8046, loss: 0.6750, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  32%|###1      | 35/111 [00:24<00:54,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9470, LAS: 0.9040, UEM: 0.5709, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6367, partial_loss/deprel_loss: 0.6364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8075, loss: 0.6898, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  35%|###5      | 39/111 [00:26<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9481, LAS: 0.9056, UEM: 0.5839, LEM: 0.3616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1492, partial_loss/deprel_loss: 0.2564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4060, loss: 0.6773, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  39%|###8      | 43/111 [00:29<00:47,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9492, LAS: 0.9066, UEM: 0.5935, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2049, partial_loss/deprel_loss: 0.3325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.6670, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  42%|####2     | 47/111 [00:31<00:42,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9481, LAS: 0.9053, UEM: 0.5892, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2277, partial_loss/deprel_loss: 0.3805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5210, loss: 0.6769, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  47%|####6     | 52/111 [00:34<00:35,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9481, LAS: 0.9055, UEM: 0.5862, LEM: 0.3568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2382, partial_loss/deprel_loss: 0.4381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5692, loss: 0.6759, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  51%|#####1    | 57/111 [00:36<00:30,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9497, LAS: 0.9070, UEM: 0.5991, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1718, partial_loss/deprel_loss: 0.3393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.6644, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  56%|#####5    | 62/111 [00:38<00:25,  1.92it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9489, LAS: 0.9063, UEM: 0.5947, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2533, partial_loss/deprel_loss: 0.3932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5362, loss: 0.6699, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  59%|#####9    | 66/111 [00:41<00:25,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9494, LAS: 0.9067, UEM: 0.5983, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1346, partial_loss/deprel_loss: 0.2575, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4039, loss: 0.6678, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  63%|######3   | 70/111 [00:43<00:23,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9503, LAS: 0.9076, UEM: 0.6103, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2235, partial_loss/deprel_loss: 0.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4869, loss: 0.6601, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  67%|######6   | 74/111 [00:46<00:23,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9505, LAS: 0.9081, UEM: 0.6227, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5366, partial_loss/deprel_loss: 0.5849, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7462, loss: 0.6569, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  70%|#######   | 78/111 [00:50<00:22,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9508, LAS: 0.9084, UEM: 0.6206, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.5950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7706, loss: 0.6562, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  74%|#######3  | 82/111 [00:52<00:20,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9510, LAS: 0.9085, UEM: 0.6165, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3369, partial_loss/deprel_loss: 0.5227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6566, loss: 0.6572, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  77%|#######6  | 85/111 [00:55<00:18,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9511, LAS: 0.9085, UEM: 0.6129, LEM: 0.3792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5236, partial_loss/deprel_loss: 0.5315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7009, loss: 0.6570, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  79%|#######9  | 88/111 [00:57<00:16,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9504, LAS: 0.9078, UEM: 0.6034, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6980, partial_loss/deprel_loss: 0.6253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8108, loss: 0.6609, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  83%|########2 | 92/111 [00:59<00:13,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9509, LAS: 0.9082, UEM: 0.6093, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3124, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5815, loss: 0.6571, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  86%|########5 | 95/111 [01:02<00:11,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9513, LAS: 0.9088, UEM: 0.6183, LEM: 0.3879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5063, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7596, loss: 0.6536, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  88%|########8 | 98/111 [01:04<00:09,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9511, LAS: 0.9085, UEM: 0.6137, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8182, partial_loss/deprel_loss: 0.7218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9121, loss: 0.6563, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  92%|#########1| 102/111 [01:07<00:06,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9506, LAS: 0.9079, UEM: 0.6094, LEM: 0.3796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6152, partial_loss/deprel_loss: 0.6973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8518, loss: 0.6612, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  95%|#########5| 106/111 [01:09<00:03,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9504, LAS: 0.9075, UEM: 0.6031, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8294, partial_loss/deprel_loss: 0.6723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8747, loss: 0.6649, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  99%|#########9| 110/111 [01:11<00:00,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9503, LAS: 0.9075, UEM: 0.6013, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5801, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7436, loss: 0.6656, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
+      "2023-04-07 00:50:25,578 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:50:25,578 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.571  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.580  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - UEM                      |     0.601  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - LAS                      |     0.907  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - loss                     |     0.666  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - LEM                      |     0.372  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
+      "2023-04-07 00:50:25,580 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:50:25,580 - INFO - combo.training.tensorboard_writer - EM                       |     0.903  |       N/A\n",
+      "2023-04-07 00:50:25,580 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:50:25,584 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:50:30,371 - INFO - combo.training.trainer - Epoch duration: 0:01:20.352845\n",
+      "2023-04-07 00:50:30,372 - INFO - combo.training.trainer - Estimated training time remaining: 7:01:50\n",
+      "2023-04-07 00:50:30,372 - INFO - allennlp.training.trainer - Epoch 89/399\n",
+      "2023-04-07 00:50:30,372 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:50:30,373 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:50:30,382 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9624, LAS: 0.9199, UEM: 0.6179, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2774, partial_loss/deprel_loss: 0.4097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5542, loss: 0.5893, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:   3%|2         | 3/111 [00:02<01:13,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9575, LAS: 0.9151, UEM: 0.6054, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4951, partial_loss/deprel_loss: 0.5040, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6732, loss: 0.6034, batch_reg_loss: 0.1709, reg_loss: 0.1710 ||:   5%|5         | 6/111 [00:04<01:11,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9608, LAS: 0.9188, UEM: 0.6575, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2058, partial_loss/deprel_loss: 0.3477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4903, loss: 0.5747, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:   8%|8         | 9/111 [00:06<01:13,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9648, UAS: 0.9584, LAS: 0.9174, UEM: 0.7075, LEM: 0.4978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0484, partial_loss/deprel_loss: 0.1350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2886, loss: 0.5920, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  12%|#1        | 13/111 [00:09<01:12,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8350, UAS: 0.9516, LAS: 0.9103, UEM: 0.6846, LEM: 0.4747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5908, partial_loss/deprel_loss: 0.9539, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2522, loss: 0.6493, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  14%|#4        | 16/111 [00:14<01:31,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9528, LAS: 0.9117, UEM: 0.6715, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4789, partial_loss/deprel_loss: 0.5093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6741, loss: 0.6407, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  18%|#8        | 20/111 [00:16<01:18,  1.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9546, LAS: 0.9136, UEM: 0.6846, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2704, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5860, loss: 0.6282, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  21%|##        | 23/111 [00:18<01:10,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9526, LAS: 0.9115, UEM: 0.6587, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6559, partial_loss/deprel_loss: 0.6576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8282, loss: 0.6451, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  24%|##4       | 27/111 [00:20<01:00,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9520, LAS: 0.9108, UEM: 0.6580, LEM: 0.4407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1778, partial_loss/deprel_loss: 0.3197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4622, loss: 0.6525, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  29%|##8       | 32/111 [00:23<00:52,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9523, LAS: 0.9115, UEM: 0.6451, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2655, partial_loss/deprel_loss: 0.3666, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5173, loss: 0.6465, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  33%|###3      | 37/111 [00:25<00:44,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9529, LAS: 0.9117, UEM: 0.6360, LEM: 0.4120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3649, partial_loss/deprel_loss: 0.4438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5989, loss: 0.6419, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  38%|###7      | 42/111 [00:27<00:37,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9533, LAS: 0.9119, UEM: 0.6308, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3812, partial_loss/deprel_loss: 0.4649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6191, loss: 0.6401, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  41%|####1     | 46/111 [00:30<00:37,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9530, LAS: 0.9112, UEM: 0.6381, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4505, partial_loss/deprel_loss: 0.6057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7455, loss: 0.6447, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  45%|####5     | 50/111 [00:33<00:36,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9541, LAS: 0.9121, UEM: 0.6467, LEM: 0.4193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3036, partial_loss/deprel_loss: 0.4205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5680, loss: 0.6382, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  49%|####8     | 54/111 [00:35<00:35,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9531, LAS: 0.9111, UEM: 0.6393, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7622, partial_loss/deprel_loss: 0.6086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8102, loss: 0.6446, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  52%|#####2    | 58/111 [00:38<00:33,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9534, LAS: 0.9116, UEM: 0.6483, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8199, partial_loss/deprel_loss: 0.5976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8129, loss: 0.6389, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  56%|#####5    | 62/111 [00:41<00:32,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9523, LAS: 0.9106, UEM: 0.6397, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7800, partial_loss/deprel_loss: 0.5918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8003, loss: 0.6471, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  59%|#####9    | 66/111 [00:44<00:30,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9529, LAS: 0.9111, UEM: 0.6421, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3019, partial_loss/deprel_loss: 0.4465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5885, loss: 0.6425, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  63%|######3   | 70/111 [00:46<00:28,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9534, LAS: 0.9117, UEM: 0.6431, LEM: 0.4159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2698, partial_loss/deprel_loss: 0.3487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5037, loss: 0.6379, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  66%|######5   | 73/111 [00:49<00:26,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8478, UAS: 0.9525, LAS: 0.9106, UEM: 0.6362, LEM: 0.4094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3974, partial_loss/deprel_loss: 0.8038, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0934, loss: 0.6450, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  68%|######8   | 76/111 [00:51<00:24,  1.46it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9526, LAS: 0.9106, UEM: 0.6360, LEM: 0.4098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4778, partial_loss/deprel_loss: 0.5209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6831, loss: 0.6453, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  71%|#######1  | 79/111 [00:53<00:22,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9524, LAS: 0.9105, UEM: 0.6310, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3757, partial_loss/deprel_loss: 0.4632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6165, loss: 0.6464, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  75%|#######4  | 83/111 [00:55<00:18,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9519, LAS: 0.9099, UEM: 0.6210, LEM: 0.3966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6011, partial_loss/deprel_loss: 0.6377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8012, loss: 0.6522, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  78%|#######8  | 87/111 [00:58<00:15,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9520, LAS: 0.9102, UEM: 0.6168, LEM: 0.3921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2273, partial_loss/deprel_loss: 0.3068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4617, loss: 0.6498, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  82%|########1 | 91/111 [01:00<00:13,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9522, LAS: 0.9103, UEM: 0.6161, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.4240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5542, loss: 0.6488, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  85%|########4 | 94/111 [01:02<00:11,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9523, LAS: 0.9104, UEM: 0.6158, LEM: 0.3889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2154, partial_loss/deprel_loss: 0.3287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.6470, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  87%|########7 | 97/111 [01:05<00:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9526, LAS: 0.9105, UEM: 0.6182, LEM: 0.3887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3185, partial_loss/deprel_loss: 0.5270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6561, loss: 0.6454, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  91%|######### | 101/111 [01:07<00:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9128, UAS: 0.9519, LAS: 0.9096, UEM: 0.6129, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4470, partial_loss/deprel_loss: 0.5585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7070, loss: 0.6513, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  94%|#########3| 104/111 [01:09<00:04,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9515, LAS: 0.9093, UEM: 0.6072, LEM: 0.3791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6124, partial_loss/deprel_loss: 0.5701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7494, loss: 0.6536, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  97%|#########7| 108/111 [01:12<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9515, LAS: 0.9093, UEM: 0.6053, LEM: 0.3766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4246, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6678, loss: 0.6540, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 100%|##########| 111/111 [01:14<00:00,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9515, LAS: 0.9093, UEM: 0.6053, LEM: 0.3766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4246, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6678, loss: 0.6540, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
+      "2023-04-07 00:51:48,085 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.515  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.425  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - UEM                      |     0.605  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - LAS                      |     0.909  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - loss                     |     0.654  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - LEM                      |     0.377  |       N/A\n",
+      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - UAS                      |     0.951  |       N/A\n",
+      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - EM                       |     0.909  |       N/A\n",
+      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:51:48,092 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:51:53,928 - INFO - combo.training.trainer - Epoch duration: 0:01:23.555709\n",
+      "2023-04-07 00:51:53,928 - INFO - combo.training.trainer - Estimated training time remaining: 7:00:36\n",
+      "2023-04-07 00:51:53,928 - INFO - allennlp.training.trainer - Epoch 90/399\n",
+      "2023-04-07 00:51:53,928 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:51:53,929 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:51:53,937 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9586, LAS: 0.9155, UEM: 0.5270, LEM: 0.2716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4390, partial_loss/deprel_loss: 0.4760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6394, loss: 0.6227, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:   4%|3         | 4/111 [00:02<01:11,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9620, LAS: 0.9203, UEM: 0.6100, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3636, partial_loss/deprel_loss: 0.3784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5462, loss: 0.5838, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:   6%|6         | 7/111 [00:05<01:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8784, UAS: 0.9583, LAS: 0.9171, UEM: 0.6267, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8749, partial_loss/deprel_loss: 0.6410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8585, loss: 0.6021, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  10%|9         | 11/111 [00:07<01:05,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9531, LAS: 0.9121, UEM: 0.5706, LEM: 0.3167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9044, partial_loss/deprel_loss: 0.6860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9005, loss: 0.6420, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  14%|#4        | 16/111 [00:09<00:56,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9505, LAS: 0.9098, UEM: 0.5415, LEM: 0.2919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0960, partial_loss/deprel_loss: 0.7426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9841, loss: 0.6564, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  19%|#8        | 21/111 [00:11<00:50,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9480, UAS: 0.9539, LAS: 0.9130, UEM: 0.6156, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1117, partial_loss/deprel_loss: 0.2053, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3574, loss: 0.6258, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  23%|##3       | 26/111 [00:14<00:48,  1.77it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9558, LAS: 0.9152, UEM: 0.6321, LEM: 0.3780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2744, partial_loss/deprel_loss: 0.3847, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5334, loss: 0.6117, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  27%|##7       | 30/111 [00:17<00:47,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9541, LAS: 0.9137, UEM: 0.6241, LEM: 0.3791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0644, partial_loss/deprel_loss: 0.7645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9952, loss: 0.6239, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  31%|###       | 34/111 [00:20<00:48,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9553, LAS: 0.9151, UEM: 0.6368, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2827, partial_loss/deprel_loss: 0.2994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4668, loss: 0.6155, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  34%|###4      | 38/111 [00:22<00:44,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9557, LAS: 0.9154, UEM: 0.6404, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1780, partial_loss/deprel_loss: 0.3391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4776, loss: 0.6130, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  38%|###7      | 42/111 [00:25<00:44,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8760, UAS: 0.9546, LAS: 0.9140, UEM: 0.6388, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9500, partial_loss/deprel_loss: 0.6070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8463, loss: 0.6205, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  41%|####1     | 46/111 [00:28<00:44,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9547, LAS: 0.9141, UEM: 0.6337, LEM: 0.3903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3840, partial_loss/deprel_loss: 0.4231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5860, loss: 0.6183, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  45%|####5     | 50/111 [00:30<00:39,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9541, LAS: 0.9134, UEM: 0.6280, LEM: 0.3864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.4235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5810, loss: 0.6211, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  49%|####8     | 54/111 [00:33<00:37,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9543, LAS: 0.9132, UEM: 0.6260, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, partial_loss/deprel_loss: 0.4607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6095, loss: 0.6207, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  52%|#####2    | 58/111 [00:36<00:36,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9543, LAS: 0.9130, UEM: 0.6279, LEM: 0.3851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2470, partial_loss/deprel_loss: 0.3760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5209, loss: 0.6219, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  55%|#####4    | 61/111 [00:38<00:34,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8940, UAS: 0.9539, LAS: 0.9125, UEM: 0.6219, LEM: 0.3795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5638, partial_loss/deprel_loss: 0.5155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6958, loss: 0.6253, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  59%|#####8    | 65/111 [00:41<00:30,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8806, UAS: 0.9537, LAS: 0.9121, UEM: 0.6204, LEM: 0.3791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8245, partial_loss/deprel_loss: 0.6926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8897, loss: 0.6278, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  61%|######1   | 68/111 [00:43<00:29,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9538, LAS: 0.9124, UEM: 0.6296, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0910, partial_loss/deprel_loss: 0.2150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3609, loss: 0.6257, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  64%|######3   | 71/111 [00:45<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9180, UAS: 0.9534, LAS: 0.9119, UEM: 0.6202, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3472, partial_loss/deprel_loss: 0.4775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.6306, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  68%|######7   | 75/111 [00:48<00:25,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9531, LAS: 0.9114, UEM: 0.6143, LEM: 0.3787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8013, partial_loss/deprel_loss: 0.6878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8812, loss: 0.6355, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  70%|#######   | 78/111 [00:50<00:23,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9531, LAS: 0.9113, UEM: 0.6071, LEM: 0.3708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5766, partial_loss/deprel_loss: 0.6206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7825, loss: 0.6377, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  74%|#######3  | 82/111 [00:53<00:19,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8973, UAS: 0.9525, LAS: 0.9106, UEM: 0.6012, LEM: 0.3661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4863, partial_loss/deprel_loss: 0.5547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7117, loss: 0.6427, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  77%|#######6  | 85/111 [00:55<00:17,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9518, LAS: 0.9098, UEM: 0.5942, LEM: 0.3610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7252, partial_loss/deprel_loss: 0.6054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8001, loss: 0.6498, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  79%|#######9  | 88/111 [00:57<00:15,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9520, LAS: 0.9100, UEM: 0.5902, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.3801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5287, loss: 0.6494, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  83%|########2 | 92/111 [00:59<00:12,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9525, LAS: 0.9105, UEM: 0.5960, LEM: 0.3611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1836, partial_loss/deprel_loss: 0.2796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4311, loss: 0.6452, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  86%|########5 | 95/111 [01:02<00:11,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9515, LAS: 0.9095, UEM: 0.5901, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6474, partial_loss/deprel_loss: 0.6101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7882, loss: 0.6541, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  89%|########9 | 99/111 [01:04<00:08,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9516, LAS: 0.9096, UEM: 0.5925, LEM: 0.3564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7554, partial_loss/deprel_loss: 0.5501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7618, loss: 0.6533, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  92%|#########1| 102/111 [01:07<00:06,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9509, LAS: 0.9089, UEM: 0.5867, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5455, partial_loss/deprel_loss: 0.5296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7035, loss: 0.6580, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  95%|#########4| 105/111 [01:09<00:04,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9513, LAS: 0.9093, UEM: 0.5920, LEM: 0.3550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2537, partial_loss/deprel_loss: 0.4396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5731, loss: 0.6548, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  97%|#########7| 108/111 [01:11<00:02,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9515, LAS: 0.9096, UEM: 0.6028, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6137, partial_loss/deprel_loss: 0.5685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7482, loss: 0.6535, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 100%|##########| 111/111 [01:14<00:00,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9515, LAS: 0.9096, UEM: 0.6028, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6137, partial_loss/deprel_loss: 0.5685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7482, loss: 0.6535, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
+      "2023-04-07 00:53:10,727 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9666, LAS: 0.9178, UEM: 0.7733, LEM: 0.4474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4139, partial_loss/deprel_loss: 25.6641, partial_loss/cycle_loss: 0.0000, batch_loss: 20.6140, loss: 19.3419, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8775, UAS: 0.9579, LAS: 0.9100, UEM: 0.7512, LEM: 0.4936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9262, partial_loss/deprel_loss: 35.7394, partial_loss/cycle_loss: 0.0000, batch_loss: 28.7767, loss: 21.8718, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:05<00:04,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9531, LAS: 0.9020, UEM: 0.6854, LEM: 0.4134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7791, partial_loss/deprel_loss: 28.9505, partial_loss/cycle_loss: 0.0000, batch_loss: 23.3162, loss: 23.2931, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:07<00:01,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.9464, LAS: 0.8943, UEM: 0.6498, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7166, partial_loss/deprel_loss: 55.2239, partial_loss/cycle_loss: 0.0000, batch_loss: 44.5224, loss: 25.0047, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:09<00:00,  1.39it/s]\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.569  |    55.224\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.614  |     1.717\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |     0.000\n",
+      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - UEM                      |     0.603  |     0.650\n",
+      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - LAS                      |     0.910  |     0.894\n",
+      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - loss                     |     0.654  |    25.005\n",
+      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - LEM                      |     0.372  |     0.386\n",
+      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - UAS                      |     0.951  |     0.946\n",
+      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - EM                       |     0.904  |     0.829\n",
+      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:53:20,063 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 00:53:24,854 - INFO - combo.training.trainer - Epoch duration: 0:01:30.925328\n",
+      "2023-04-07 00:53:24,854 - INFO - combo.training.trainer - Estimated training time remaining: 6:59:47\n",
+      "2023-04-07 00:53:24,854 - INFO - allennlp.training.trainer - Epoch 91/399\n",
+      "2023-04-07 00:53:24,854 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:53:24,855 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:53:24,864 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8414, UAS: 0.9196, LAS: 0.8740, UEM: 0.1556, LEM: 0.0356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5877, partial_loss/deprel_loss: 0.9074, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2141, loss: 0.9081, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:   3%|2         | 3/111 [00:02<01:18,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9417, LAS: 0.9000, UEM: 0.5139, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5749, partial_loss/deprel_loss: 0.4906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6781, loss: 0.7202, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:   6%|6         | 7/111 [00:04<01:12,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9332, LAS: 0.8911, UEM: 0.4231, LEM: 0.2178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9388, partial_loss/deprel_loss: 0.7218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9358, loss: 0.7898, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  10%|9         | 11/111 [00:07<01:07,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9391, LAS: 0.8975, UEM: 0.5123, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6934, partial_loss/deprel_loss: 0.6334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8161, loss: 0.7382, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  14%|#3        | 15/111 [00:09<01:03,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9411, LAS: 0.8992, UEM: 0.4980, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2657, partial_loss/deprel_loss: 0.3629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.7306, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  16%|#6        | 18/111 [00:11<01:03,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9448, LAS: 0.9035, UEM: 0.5821, LEM: 0.3803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1763, partial_loss/deprel_loss: 0.2714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4230, loss: 0.6973, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  19%|#8        | 21/111 [00:14<01:03,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9467, LAS: 0.9060, UEM: 0.5947, LEM: 0.3892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1693, partial_loss/deprel_loss: 0.2629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4149, loss: 0.6790, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  22%|##1       | 24/111 [00:16<01:03,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9484, LAS: 0.9081, UEM: 0.5871, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2777, partial_loss/deprel_loss: 0.3964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.6673, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  25%|##5       | 28/111 [00:18<00:57,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9507, LAS: 0.9106, UEM: 0.6326, LEM: 0.4190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3565, partial_loss/deprel_loss: 0.4421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5957, loss: 0.6473, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  28%|##7       | 31/111 [00:21<00:58,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9501, LAS: 0.9099, UEM: 0.6233, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1390, partial_loss/deprel_loss: 0.7462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9954, loss: 0.6526, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  32%|###1      | 35/111 [00:23<00:53,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9501, LAS: 0.9099, UEM: 0.6146, LEM: 0.3962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7562, partial_loss/deprel_loss: 0.6199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8178, loss: 0.6525, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  34%|###4      | 38/111 [00:26<00:50,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9507, LAS: 0.9103, UEM: 0.6202, LEM: 0.3983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0333, partial_loss/deprel_loss: 0.7240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9565, loss: 0.6498, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  38%|###7      | 42/111 [00:28<00:47,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8811, UAS: 0.9501, LAS: 0.9096, UEM: 0.6078, LEM: 0.3855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0019, partial_loss/deprel_loss: 0.5839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8381, loss: 0.6546, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  41%|####1     | 46/111 [00:31<00:42,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9508, LAS: 0.9102, UEM: 0.6114, LEM: 0.3855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2693, partial_loss/deprel_loss: 0.4158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5571, loss: 0.6488, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  45%|####5     | 50/111 [00:33<00:40,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9505, LAS: 0.9100, UEM: 0.6099, LEM: 0.3849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2493, partial_loss/deprel_loss: 0.3717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5179, loss: 0.6507, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  49%|####8     | 54/111 [00:36<00:38,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9514, LAS: 0.9109, UEM: 0.6192, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3527, partial_loss/deprel_loss: 0.4770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6227, loss: 0.6443, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  52%|#####2    | 58/111 [00:39<00:36,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9515, LAS: 0.9108, UEM: 0.6114, LEM: 0.3828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6184, partial_loss/deprel_loss: 0.5387, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7252, loss: 0.6485, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  56%|#####5    | 62/111 [00:42<00:33,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9513, LAS: 0.9104, UEM: 0.6053, LEM: 0.3773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3285, partial_loss/deprel_loss: 0.4954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6326, loss: 0.6525, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  59%|#####9    | 66/111 [00:44<00:30,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8940, UAS: 0.9512, LAS: 0.9098, UEM: 0.5997, LEM: 0.3700, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4839, partial_loss/deprel_loss: 0.6563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7924, loss: 0.6560, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  63%|######3   | 70/111 [00:47<00:28,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9680, UAS: 0.9520, LAS: 0.9109, UEM: 0.6199, LEM: 0.3973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0445, partial_loss/deprel_loss: 0.1407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2920, loss: 0.6489, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  66%|######5   | 73/111 [00:49<00:27,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9522, LAS: 0.9109, UEM: 0.6165, LEM: 0.3915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3092, partial_loss/deprel_loss: 0.4750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6124, loss: 0.6500, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  68%|######8   | 76/111 [00:52<00:25,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9519, LAS: 0.9106, UEM: 0.6132, LEM: 0.3887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7848, partial_loss/deprel_loss: 0.6318, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8330, loss: 0.6508, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  71%|#######1  | 79/111 [00:54<00:23,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9523, LAS: 0.9111, UEM: 0.6146, LEM: 0.3882, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2224, partial_loss/deprel_loss: 0.3762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.6476, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  74%|#######3  | 82/111 [00:56<00:20,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9525, LAS: 0.9114, UEM: 0.6173, LEM: 0.3902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7428, partial_loss/deprel_loss: 0.5632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7697, loss: 0.6460, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  77%|#######6  | 85/111 [00:58<00:19,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9521, LAS: 0.9110, UEM: 0.6158, LEM: 0.3891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2247, partial_loss/deprel_loss: 0.3346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4831, loss: 0.6467, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  81%|########1 | 90/111 [01:01<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9520, LAS: 0.9106, UEM: 0.6101, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5589, partial_loss/deprel_loss: 0.5639, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7335, loss: 0.6502, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  85%|########4 | 94/111 [01:03<00:10,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9528, LAS: 0.9115, UEM: 0.6231, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2567, partial_loss/deprel_loss: 0.3461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4987, loss: 0.6430, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  88%|########8 | 98/111 [01:06<00:08,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9529, LAS: 0.9116, UEM: 0.6202, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6575, partial_loss/deprel_loss: 0.6112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7910, loss: 0.6424, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  92%|#########1| 102/111 [01:08<00:05,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9525, LAS: 0.9110, UEM: 0.6148, LEM: 0.3845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5890, partial_loss/deprel_loss: 0.5102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6965, loss: 0.6469, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  95%|#########5| 106/111 [01:11<00:03,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9521, LAS: 0.9106, UEM: 0.6092, LEM: 0.3793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9806, partial_loss/deprel_loss: 0.7078, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9329, loss: 0.6498, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  99%|#########9| 110/111 [01:13<00:00,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9520, LAS: 0.9104, UEM: 0.6071, LEM: 0.3778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8246, partial_loss/deprel_loss: 0.6674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8694, loss: 0.6518, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
+      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.667  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.825  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - UEM                      |     0.607  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - LAS                      |     0.910  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - loss                     |     0.652  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - LEM                      |     0.378  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - UAS                      |     0.952  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - EM                       |     0.891  |       N/A\n",
+      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:54:41,921 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:54:46,283 - INFO - combo.training.trainer - Epoch duration: 0:01:21.429347\n",
+      "2023-04-07 00:54:46,284 - INFO - combo.training.trainer - Estimated training time remaining: 6:58:25\n",
+      "2023-04-07 00:54:46,284 - INFO - allennlp.training.trainer - Epoch 92/399\n",
+      "2023-04-07 00:54:46,284 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:54:46,285 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:54:46,293 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9542, LAS: 0.9139, UEM: 0.7424, LEM: 0.5818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5152, partial_loss/deprel_loss: 0.5199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6895, loss: 0.6134, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:   3%|2         | 3/111 [00:02<01:21,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9128, UAS: 0.9479, LAS: 0.9073, UEM: 0.6124, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3346, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5882, loss: 0.6523, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:   5%|5         | 6/111 [00:04<01:18,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9463, LAS: 0.9048, UEM: 0.6333, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 0.3244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4584, loss: 0.6718, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:   9%|9         | 10/111 [00:06<01:11,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9422, LAS: 0.9000, UEM: 0.5906, LEM: 0.3838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4059, partial_loss/deprel_loss: 0.4657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6242, loss: 0.7008, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:  12%|#1        | 13/111 [00:09<01:10,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9447, LAS: 0.9030, UEM: 0.5856, LEM: 0.3780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2784, partial_loss/deprel_loss: 0.3270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.6912, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:  15%|#5        | 17/111 [00:11<01:06,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9470, LAS: 0.9053, UEM: 0.5853, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2329, partial_loss/deprel_loss: 0.3702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5132, loss: 0.6773, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:  19%|#8        | 21/111 [00:14<01:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9460, LAS: 0.9037, UEM: 0.5511, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6266, partial_loss/deprel_loss: 0.5975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7738, loss: 0.6872, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:  23%|##2       | 25/111 [00:16<00:55,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9480, LAS: 0.9061, UEM: 0.5590, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2587, partial_loss/deprel_loss: 0.3937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5371, loss: 0.6726, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:  26%|##6       | 29/111 [00:19<00:52,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9489, LAS: 0.9070, UEM: 0.5670, LEM: 0.3330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7531, partial_loss/deprel_loss: 0.5853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7893, loss: 0.6676, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  29%|##8       | 32/111 [00:21<00:52,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9491, LAS: 0.9076, UEM: 0.5801, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1063, partial_loss/deprel_loss: 0.2096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3594, loss: 0.6631, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  32%|###1      | 35/111 [00:23<00:53,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9488, LAS: 0.9072, UEM: 0.5672, LEM: 0.3429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3363, partial_loss/deprel_loss: 0.4694, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6132, loss: 0.6686, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  34%|###4      | 38/111 [00:25<00:52,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9494, LAS: 0.9079, UEM: 0.5780, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1917, partial_loss/deprel_loss: 0.3255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4692, loss: 0.6623, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  37%|###6      | 41/111 [00:28<00:51,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9505, LAS: 0.9092, UEM: 0.5912, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2921, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.6529, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  40%|###9      | 44/111 [00:30<00:48,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9502, LAS: 0.9091, UEM: 0.5955, LEM: 0.3680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2522, partial_loss/deprel_loss: 0.6656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9533, loss: 0.6536, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  42%|####2     | 47/111 [00:32<00:47,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9506, LAS: 0.9097, UEM: 0.5931, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.3769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5290, loss: 0.6486, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  45%|####5     | 50/111 [00:35<00:47,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9503, LAS: 0.9092, UEM: 0.5891, LEM: 0.3591, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4746, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6548, loss: 0.6510, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  49%|####8     | 54/111 [00:37<00:40,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9506, LAS: 0.9095, UEM: 0.5857, LEM: 0.3544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3050, partial_loss/deprel_loss: 0.3623, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5212, loss: 0.6479, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  51%|#####1    | 57/111 [00:39<00:39,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9515, LAS: 0.9105, UEM: 0.5931, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1843, partial_loss/deprel_loss: 0.2933, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4419, loss: 0.6429, batch_reg_loss: 0.1704, reg_loss: 0.1704 ||:  55%|#####4    | 61/111 [00:42<00:35,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8981, UAS: 0.9504, LAS: 0.9094, UEM: 0.5806, LEM: 0.3502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6265, partial_loss/deprel_loss: 0.5127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7059, loss: 0.6522, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  59%|#####8    | 65/111 [00:44<00:31,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9501, LAS: 0.9092, UEM: 0.5760, LEM: 0.3450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9519, partial_loss/deprel_loss: 0.6115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8500, loss: 0.6552, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  62%|######2   | 69/111 [00:47<00:27,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9514, LAS: 0.9108, UEM: 0.6083, LEM: 0.3858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4295, partial_loss/deprel_loss: 0.4640, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6274, loss: 0.6452, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  66%|######5   | 73/111 [00:50<00:26,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9524, LAS: 0.9119, UEM: 0.6201, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3675, partial_loss/deprel_loss: 0.3858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5524, loss: 0.6368, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  69%|######9   | 77/111 [00:53<00:23,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9531, LAS: 0.9123, UEM: 0.6260, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1469, partial_loss/deprel_loss: 0.3113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4487, loss: 0.6328, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  72%|#######2  | 80/111 [00:55<00:21,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9530, LAS: 0.9125, UEM: 0.6196, LEM: 0.3912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6422, partial_loss/deprel_loss: 0.5340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7260, loss: 0.6324, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  76%|#######5  | 84/111 [00:57<00:17,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9531, LAS: 0.9127, UEM: 0.6151, LEM: 0.3860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3872, partial_loss/deprel_loss: 0.4186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5826, loss: 0.6309, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  79%|#######9  | 88/111 [00:59<00:14,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9534, LAS: 0.9129, UEM: 0.6182, LEM: 0.3891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1823, partial_loss/deprel_loss: 0.3832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5133, loss: 0.6296, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  83%|########2 | 92/111 [01:02<00:11,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9536, LAS: 0.9132, UEM: 0.6242, LEM: 0.3969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1635, partial_loss/deprel_loss: 0.3041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4462, loss: 0.6277, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||:  86%|########6 | 96/111 [01:04<00:08,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9539, LAS: 0.9134, UEM: 0.6223, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5956, partial_loss/deprel_loss: 0.5345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7169, loss: 0.6272, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||:  91%|######### | 101/111 [01:06<00:05,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9542, LAS: 0.9139, UEM: 0.6224, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2040, partial_loss/deprel_loss: 0.2981, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4494, loss: 0.6243, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||:  95%|#########5| 106/111 [01:09<00:02,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9536, LAS: 0.9133, UEM: 0.6157, LEM: 0.3883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3588, partial_loss/deprel_loss: 0.4519, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.6290, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||:  99%|#########9| 110/111 [01:12<00:00,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9536, LAS: 0.9133, UEM: 0.6142, LEM: 0.3870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4580, partial_loss/deprel_loss: 0.4665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6350, loss: 0.6291, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
+      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.467  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.458  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.170  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - UEM                      |     0.614  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - LAS                      |     0.913  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - loss                     |     0.629  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - LEM                      |     0.387  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - UAS                      |     0.954  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - EM                       |     0.915  |       N/A\n",
+      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:56:02,425 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:56:07,411 - INFO - combo.training.trainer - Epoch duration: 0:01:21.127162\n",
+      "2023-04-07 00:56:07,412 - INFO - combo.training.trainer - Estimated training time remaining: 6:57:02\n",
+      "2023-04-07 00:56:07,412 - INFO - allennlp.training.trainer - Epoch 93/399\n",
+      "2023-04-07 00:56:07,412 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:56:07,413 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:56:07,422 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9622, LAS: 0.9221, UEM: 0.7398, LEM: 0.5281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1570, partial_loss/deprel_loss: 0.2857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4302, loss: 0.5584, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||:   4%|3         | 4/111 [00:02<01:17,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9572, LAS: 0.9153, UEM: 0.6616, LEM: 0.4305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2660, partial_loss/deprel_loss: 0.4206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.6086, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||:   7%|7         | 8/111 [00:05<01:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9590, LAS: 0.9168, UEM: 0.6598, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2378, partial_loss/deprel_loss: 0.3891, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5290, loss: 0.6018, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||:  10%|9         | 11/111 [00:07<01:09,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9566, LAS: 0.9156, UEM: 0.6450, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6822, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7548, loss: 0.6125, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||:  13%|#2        | 14/111 [00:09<01:10,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9550, LAS: 0.9141, UEM: 0.6348, LEM: 0.3942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2216, partial_loss/deprel_loss: 0.3102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4626, loss: 0.6239, batch_reg_loss: 0.1701, reg_loss: 0.1702 ||:  15%|#5        | 17/111 [00:11<01:07,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9546, LAS: 0.9142, UEM: 0.6136, LEM: 0.3776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4356, partial_loss/deprel_loss: 0.4792, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6406, loss: 0.6247, batch_reg_loss: 0.1701, reg_loss: 0.1702 ||:  19%|#8        | 21/111 [00:14<01:01,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9557, LAS: 0.9156, UEM: 0.6347, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1566, partial_loss/deprel_loss: 0.2693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4169, loss: 0.6161, batch_reg_loss: 0.1701, reg_loss: 0.1702 ||:  23%|##2       | 25/111 [00:16<00:57,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9546, LAS: 0.9146, UEM: 0.6127, LEM: 0.3836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3816, partial_loss/deprel_loss: 0.4059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5711, loss: 0.6273, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||:  26%|##6       | 29/111 [00:19<00:53,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9565, LAS: 0.9172, UEM: 0.6595, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1907, partial_loss/deprel_loss: 0.3468, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4857, loss: 0.6083, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||:  29%|##8       | 32/111 [00:21<00:53,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9561, LAS: 0.9169, UEM: 0.6562, LEM: 0.4394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1723, partial_loss/deprel_loss: 0.3134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4553, loss: 0.6078, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||:  32%|###2      | 36/111 [00:24<00:52,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9555, LAS: 0.9164, UEM: 0.6497, LEM: 0.4317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7917, partial_loss/deprel_loss: 0.5317, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7538, loss: 0.6085, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||:  35%|###5      | 39/111 [00:26<00:53,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9564, LAS: 0.9174, UEM: 0.6608, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1739, partial_loss/deprel_loss: 0.3126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4549, loss: 0.6001, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||:  38%|###7      | 42/111 [00:29<00:53,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9564, LAS: 0.9173, UEM: 0.6523, LEM: 0.4318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2875, partial_loss/deprel_loss: 0.3333, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4941, loss: 0.6016, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  41%|####      | 45/111 [00:31<00:49,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9561, LAS: 0.9169, UEM: 0.6436, LEM: 0.4207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5652, loss: 0.6044, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  44%|####4     | 49/111 [00:34<00:44,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9565, LAS: 0.9175, UEM: 0.6450, LEM: 0.4208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6738, partial_loss/deprel_loss: 0.5516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7461, loss: 0.6009, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  48%|####7     | 53/111 [00:36<00:40,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9563, LAS: 0.9174, UEM: 0.6370, LEM: 0.4121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4258, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5746, loss: 0.6023, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  50%|#####     | 56/111 [00:38<00:38,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9566, LAS: 0.9178, UEM: 0.6402, LEM: 0.4125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5124, partial_loss/deprel_loss: 0.5456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7090, loss: 0.6001, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  53%|#####3    | 59/111 [00:40<00:36,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9570, LAS: 0.9181, UEM: 0.6485, LEM: 0.4235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.4408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5885, loss: 0.5983, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  56%|#####5    | 62/111 [00:43<00:34,  1.42it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9567, LAS: 0.9178, UEM: 0.6434, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2561, partial_loss/deprel_loss: 0.3669, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5147, loss: 0.5990, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  59%|#####8    | 65/111 [00:45<00:32,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9572, LAS: 0.9183, UEM: 0.6455, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2146, partial_loss/deprel_loss: 0.2871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4426, loss: 0.5950, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  61%|######1   | 68/111 [00:47<00:31,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9570, LAS: 0.9181, UEM: 0.6403, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5097, partial_loss/deprel_loss: 0.4827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6581, loss: 0.5962, batch_reg_loss: 0.1699, reg_loss: 0.1701 ||:  64%|######3   | 71/111 [00:49<00:29,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9570, LAS: 0.9181, UEM: 0.6342, LEM: 0.4048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6196, partial_loss/deprel_loss: 0.5692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7492, loss: 0.5984, batch_reg_loss: 0.1699, reg_loss: 0.1701 ||:  68%|######8   | 76/111 [00:52<00:23,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9560, LAS: 0.9172, UEM: 0.6291, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9994, partial_loss/deprel_loss: 0.7024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9317, loss: 0.6070, batch_reg_loss: 0.1699, reg_loss: 0.1701 ||:  73%|#######2  | 81/111 [00:54<00:18,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8847, UAS: 0.9563, LAS: 0.9174, UEM: 0.6301, LEM: 0.3992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6907, partial_loss/deprel_loss: 0.7202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8842, loss: 0.6059, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||:  77%|#######7  | 86/111 [00:57<00:14,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9553, LAS: 0.9163, UEM: 0.6202, LEM: 0.3909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5477, partial_loss/deprel_loss: 0.5488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7185, loss: 0.6131, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||:  82%|########1 | 91/111 [00:59<00:10,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9557, LAS: 0.9167, UEM: 0.6267, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4010, partial_loss/deprel_loss: 0.5455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6865, loss: 0.6099, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||:  86%|########5 | 95/111 [01:02<00:09,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9554, LAS: 0.9163, UEM: 0.6206, LEM: 0.3909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6465, partial_loss/deprel_loss: 0.5652, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7514, loss: 0.6136, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||:  89%|########9 | 99/111 [01:05<00:07,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9553, LAS: 0.9162, UEM: 0.6243, LEM: 0.3965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1391, partial_loss/deprel_loss: 0.2918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4311, loss: 0.6134, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||:  93%|#########2| 103/111 [01:07<00:05,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9549, LAS: 0.9158, UEM: 0.6186, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3359, partial_loss/deprel_loss: 0.4198, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.6165, batch_reg_loss: 0.1698, reg_loss: 0.1700 ||:  96%|#########6| 107/111 [01:10<00:02,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9545, LAS: 0.9154, UEM: 0.6144, LEM: 0.3875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3012, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5413, loss: 0.6187, batch_reg_loss: 0.1698, reg_loss: 0.1700 ||: 100%|##########| 111/111 [01:13<00:00,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9545, LAS: 0.9154, UEM: 0.6144, LEM: 0.3875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3012, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5413, loss: 0.6187, batch_reg_loss: 0.1698, reg_loss: 0.1700 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.389  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.301  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.170  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - UEM                      |     0.614  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - LAS                      |     0.915  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - loss                     |     0.619  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - LEM                      |     0.388  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |       N/A\n",
+      "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - EM                       |     0.931  |       N/A\n",
+      "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:57:23,899 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:57:29,960 - INFO - combo.training.trainer - Epoch duration: 0:01:22.548285\n",
+      "2023-04-07 00:57:29,961 - INFO - combo.training.trainer - Estimated training time remaining: 6:55:44\n",
+      "2023-04-07 00:57:29,961 - INFO - allennlp.training.trainer - Epoch 94/399\n",
+      "2023-04-07 00:57:29,961 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:57:29,962 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:57:29,970 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9521, LAS: 0.9133, UEM: 0.4149, LEM: 0.2060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5899, loss: 0.6595, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:   3%|2         | 3/111 [00:02<01:12,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9224, UAS: 0.9525, LAS: 0.9124, UEM: 0.4244, LEM: 0.1976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2817, partial_loss/deprel_loss: 0.3916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.6374, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:   6%|6         | 7/111 [00:04<01:06,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9542, LAS: 0.9137, UEM: 0.4699, LEM: 0.2229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.3456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4891, loss: 0.6316, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  10%|9         | 11/111 [00:06<01:03,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9548, LAS: 0.9140, UEM: 0.4912, LEM: 0.2354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2900, partial_loss/deprel_loss: 0.4000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5478, loss: 0.6281, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  13%|#2        | 14/111 [00:08<01:03,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9528, LAS: 0.9122, UEM: 0.4714, LEM: 0.2223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7772, partial_loss/deprel_loss: 0.5558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7698, loss: 0.6451, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  16%|#6        | 18/111 [00:11<01:00,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9527, LAS: 0.9119, UEM: 0.4715, LEM: 0.2221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8692, partial_loss/deprel_loss: 0.6261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8445, loss: 0.6476, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  20%|#9        | 22/111 [00:13<00:57,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9716, UAS: 0.9558, LAS: 0.9159, UEM: 0.5880, LEM: 0.3642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0331, partial_loss/deprel_loss: 0.1041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2597, loss: 0.6200, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  23%|##2       | 25/111 [00:16<00:59,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9549, LAS: 0.9152, UEM: 0.5827, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5290, partial_loss/deprel_loss: 0.4605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6440, loss: 0.6231, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  25%|##5       | 28/111 [00:18<01:00,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9555, LAS: 0.9158, UEM: 0.5982, LEM: 0.3751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3287, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5442, loss: 0.6142, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  28%|##7       | 31/111 [00:20<00:58,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8926, UAS: 0.9560, LAS: 0.9164, UEM: 0.6102, LEM: 0.3853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7661, partial_loss/deprel_loss: 0.5392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7543, loss: 0.6087, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  31%|###       | 34/111 [00:23<00:56,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9562, LAS: 0.9169, UEM: 0.6093, LEM: 0.3828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1732, partial_loss/deprel_loss: 0.2811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4293, loss: 0.6057, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  33%|###3      | 37/111 [00:25<00:54,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9571, LAS: 0.9176, UEM: 0.6248, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3037, partial_loss/deprel_loss: 0.3452, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5066, loss: 0.6012, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  37%|###6      | 41/111 [00:28<00:49,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9555, LAS: 0.9159, UEM: 0.6103, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5706, partial_loss/deprel_loss: 0.5425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7178, loss: 0.6149, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  40%|###9      | 44/111 [00:30<00:46,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9549, LAS: 0.9153, UEM: 0.6039, LEM: 0.3760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.3133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4688, loss: 0.6180, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  42%|####2     | 47/111 [00:32<00:45,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9551, LAS: 0.9155, UEM: 0.5987, LEM: 0.3679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6414, partial_loss/deprel_loss: 0.5149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7099, loss: 0.6183, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  45%|####5     | 50/111 [00:34<00:43,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9556, LAS: 0.9162, UEM: 0.6107, LEM: 0.3821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.2417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3878, loss: 0.6148, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  48%|####7     | 53/111 [00:36<00:41,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9538, LAS: 0.9145, UEM: 0.6052, LEM: 0.3785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2717, partial_loss/deprel_loss: 0.3415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.6253, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  50%|#####     | 56/111 [00:38<00:38,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9546, LAS: 0.9152, UEM: 0.6152, LEM: 0.3848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1899, partial_loss/deprel_loss: 0.2864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4368, loss: 0.6189, batch_reg_loss: 0.1697, reg_loss: 0.1697 ||:  55%|#####4    | 61/111 [00:40<00:31,  1.58it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9545, LAS: 0.9149, UEM: 0.6062, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1938, partial_loss/deprel_loss: 0.3977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5266, loss: 0.6216, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  59%|#####9    | 66/111 [00:43<00:26,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9538, LAS: 0.9138, UEM: 0.6011, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0929, partial_loss/deprel_loss: 0.7331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9747, loss: 0.6295, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  64%|######3   | 71/111 [00:45<00:22,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9542, LAS: 0.9143, UEM: 0.6086, LEM: 0.3763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1674, partial_loss/deprel_loss: 0.2936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4380, loss: 0.6262, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  68%|######7   | 75/111 [00:48<00:20,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9537, LAS: 0.9138, UEM: 0.6020, LEM: 0.3701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4646, partial_loss/deprel_loss: 0.4516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6238, loss: 0.6289, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  71%|#######1  | 79/111 [00:50<00:18,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9539, LAS: 0.9140, UEM: 0.5997, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7002, partial_loss/deprel_loss: 0.6113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7987, loss: 0.6289, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  75%|#######4  | 83/111 [00:53<00:16,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9544, LAS: 0.9147, UEM: 0.6118, LEM: 0.3806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2079, partial_loss/deprel_loss: 0.3162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4641, loss: 0.6233, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  78%|#######8  | 87/111 [00:56<00:15,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9549, LAS: 0.9153, UEM: 0.6189, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5173, partial_loss/deprel_loss: 0.5162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6860, loss: 0.6188, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  82%|########1 | 91/111 [00:58<00:13,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8417, UAS: 0.9545, LAS: 0.9148, UEM: 0.6184, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6372, partial_loss/deprel_loss: 0.7892, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1283, loss: 0.6222, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  86%|########5 | 95/111 [01:01<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9547, LAS: 0.9150, UEM: 0.6189, LEM: 0.3840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2109, partial_loss/deprel_loss: 0.3147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4635, loss: 0.6209, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  88%|########8 | 98/111 [01:04<00:09,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9547, LAS: 0.9151, UEM: 0.6162, LEM: 0.3814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.4396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5871, loss: 0.6197, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||:  92%|#########1| 102/111 [01:06<00:06,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9550, LAS: 0.9154, UEM: 0.6205, LEM: 0.3849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4263, partial_loss/deprel_loss: 0.4916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6481, loss: 0.6173, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||:  95%|#########5| 106/111 [01:09<00:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9547, LAS: 0.9151, UEM: 0.6143, LEM: 0.3793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3580, partial_loss/deprel_loss: 0.4075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5671, loss: 0.6200, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||:  99%|#########9| 110/111 [01:11<00:00,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9572, UAS: 0.9550, LAS: 0.9155, UEM: 0.6235, LEM: 0.3915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0758, partial_loss/deprel_loss: 0.1748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3245, loss: 0.6173, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
+      "2023-04-07 00:58:45,473 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 00:58:45,473 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.175  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.076  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.170  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - UEM                      |     0.624  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - LAS                      |     0.915  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - loss                     |     0.617  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - LEM                      |     0.391  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |       N/A\n",
+      "2023-04-07 00:58:45,475 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 00:58:45,475 - INFO - combo.training.tensorboard_writer - EM                       |     0.957  |       N/A\n",
+      "2023-04-07 00:58:45,475 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 00:58:45,479 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 00:58:50,382 - INFO - combo.training.trainer - Epoch duration: 0:01:20.421411\n",
+      "2023-04-07 00:58:50,383 - INFO - combo.training.trainer - Estimated training time remaining: 6:54:19\n",
+      "2023-04-07 00:58:50,383 - INFO - allennlp.training.trainer - Epoch 95/399\n",
+      "2023-04-07 00:58:50,383 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 00:58:50,384 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 00:58:50,393 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9403, LAS: 0.8966, UEM: 0.2033, LEM: 0.0664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7028, partial_loss/deprel_loss: 0.6247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8098, loss: 0.7676, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:   3%|2         | 3/111 [00:02<01:13,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9443, LAS: 0.9015, UEM: 0.2599, LEM: 0.0791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5260, partial_loss/deprel_loss: 0.4491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6339, loss: 0.7219, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:   5%|5         | 6/111 [00:04<01:13,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9452, LAS: 0.9049, UEM: 0.4647, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1432, partial_loss/deprel_loss: 0.2551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4022, loss: 0.6918, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:   8%|8         | 9/111 [00:06<01:11,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9517, LAS: 0.9121, UEM: 0.5362, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2530, partial_loss/deprel_loss: 0.4008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5407, loss: 0.6405, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:  12%|#1        | 13/111 [00:08<01:05,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9501, LAS: 0.9100, UEM: 0.5007, LEM: 0.2911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4803, partial_loss/deprel_loss: 0.4817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.6529, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:  14%|#4        | 16/111 [00:10<01:03,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9510, LAS: 0.9112, UEM: 0.5359, LEM: 0.3277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3315, partial_loss/deprel_loss: 0.3570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5214, loss: 0.6384, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:  17%|#7        | 19/111 [00:13<01:05,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9515, LAS: 0.9117, UEM: 0.5425, LEM: 0.3300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.3072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4491, loss: 0.6385, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||:  21%|##        | 23/111 [00:15<00:59,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9527, LAS: 0.9131, UEM: 0.5493, LEM: 0.3301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4411, partial_loss/deprel_loss: 0.4339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.6308, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||:  23%|##3       | 26/111 [00:17<00:58,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9513, LAS: 0.9119, UEM: 0.5297, LEM: 0.3149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6417, partial_loss/deprel_loss: 0.5229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7161, loss: 0.6360, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||:  26%|##6       | 29/111 [00:19<00:56,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9521, LAS: 0.9128, UEM: 0.5411, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6245, partial_loss/deprel_loss: 0.4886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6852, loss: 0.6294, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||:  29%|##8       | 32/111 [00:22<00:57,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9525, LAS: 0.9133, UEM: 0.5363, LEM: 0.3086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4648, partial_loss/deprel_loss: 0.4901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6544, loss: 0.6274, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||:  32%|###1      | 35/111 [00:24<00:54,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9525, LAS: 0.9130, UEM: 0.5261, LEM: 0.2956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6211, partial_loss/deprel_loss: 0.5475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7316, loss: 0.6312, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||:  35%|###5      | 39/111 [00:26<00:49,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9537, LAS: 0.9144, UEM: 0.5419, LEM: 0.3059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4597, partial_loss/deprel_loss: 0.4636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6322, loss: 0.6227, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||:  39%|###8      | 43/111 [00:28<00:44,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9520, LAS: 0.9128, UEM: 0.5411, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1825, partial_loss/deprel_loss: 0.3025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4479, loss: 0.6364, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||:  42%|####2     | 47/111 [00:30<00:38,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9530, LAS: 0.9136, UEM: 0.5572, LEM: 0.3243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4463, partial_loss/deprel_loss: 0.5523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7004, loss: 0.6296, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||:  46%|####5     | 51/111 [00:33<00:34,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9539, LAS: 0.9149, UEM: 0.5827, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6151, partial_loss/deprel_loss: 0.5066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6976, loss: 0.6191, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  50%|#####     | 56/111 [00:35<00:30,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9541, LAS: 0.9150, UEM: 0.5864, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2266, partial_loss/deprel_loss: 0.3339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4818, loss: 0.6187, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  54%|#####4    | 60/111 [00:38<00:29,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9704, UAS: 0.9552, LAS: 0.9164, UEM: 0.6180, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0377, partial_loss/deprel_loss: 0.1045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2604, loss: 0.6088, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  58%|#####7    | 64/111 [00:41<00:32,  1.45it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9551, LAS: 0.9162, UEM: 0.6103, LEM: 0.3890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2907, partial_loss/deprel_loss: 0.3677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5216, loss: 0.6092, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  61%|######1   | 68/111 [00:44<00:28,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9553, LAS: 0.9164, UEM: 0.6085, LEM: 0.3851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2413, partial_loss/deprel_loss: 0.3382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.6091, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  65%|######4   | 72/111 [00:46<00:24,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9551, LAS: 0.9161, UEM: 0.6072, LEM: 0.3825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1896, partial_loss/deprel_loss: 0.3795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5108, loss: 0.6118, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  68%|######8   | 76/111 [00:49<00:22,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9546, LAS: 0.9153, UEM: 0.6000, LEM: 0.3749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6490, partial_loss/deprel_loss: 0.6409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8118, loss: 0.6166, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  72%|#######2  | 80/111 [00:51<00:20,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9547, LAS: 0.9156, UEM: 0.5963, LEM: 0.3708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2473, partial_loss/deprel_loss: 0.3526, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5008, loss: 0.6157, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||:  76%|#######5  | 84/111 [00:54<00:18,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9548, LAS: 0.9158, UEM: 0.5937, LEM: 0.3677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2914, partial_loss/deprel_loss: 0.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5093, loss: 0.6155, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||:  79%|#######9  | 88/111 [00:58<00:16,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9547, LAS: 0.9157, UEM: 0.5955, LEM: 0.3694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2497, partial_loss/deprel_loss: 0.3107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4677, loss: 0.6151, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||:  82%|########1 | 91/111 [01:00<00:14,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9548, LAS: 0.9158, UEM: 0.5948, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6732, partial_loss/deprel_loss: 0.6229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8022, loss: 0.6142, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||:  86%|########5 | 95/111 [01:02<00:10,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9550, LAS: 0.9159, UEM: 0.5965, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1758, partial_loss/deprel_loss: 0.2661, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4172, loss: 0.6134, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||:  89%|########9 | 99/111 [01:05<00:07,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9549, LAS: 0.9159, UEM: 0.6031, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2254, partial_loss/deprel_loss: 0.3636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5051, loss: 0.6133, batch_reg_loss: 0.1692, reg_loss: 0.1693 ||:  93%|#########2| 103/111 [01:07<00:05,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9552, LAS: 0.9162, UEM: 0.6069, LEM: 0.3765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2262, partial_loss/deprel_loss: 0.3421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.6110, batch_reg_loss: 0.1692, reg_loss: 0.1693 ||:  96%|#########6| 107/111 [01:09<00:02,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9559, LAS: 0.9168, UEM: 0.6223, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0805, partial_loss/deprel_loss: 0.1551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3094, loss: 0.6056, batch_reg_loss: 0.1692, reg_loss: 0.1693 ||: 100%|##########| 111/111 [01:12<00:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9559, LAS: 0.9168, UEM: 0.6223, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0805, partial_loss/deprel_loss: 0.1551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3094, loss: 0.6056, batch_reg_loss: 0.1692, reg_loss: 0.1693 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
+      "2023-04-07 01:00:06,571 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9433, LAS: 0.8922, UEM: 0.5839, LEM: 0.2975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3625, partial_loss/deprel_loss: 45.9887, partial_loss/cycle_loss: 0.0000, batch_loss: 37.0634, loss: 28.0423, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:03<00:10,  1.02s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9475, LAS: 0.8973, UEM: 0.5948, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5580, partial_loss/deprel_loss: 23.4960, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9084, loss: 23.4430, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9461, LAS: 0.8943, UEM: 0.5695, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1060, partial_loss/deprel_loss: 41.4238, partial_loss/cycle_loss: 0.0000, batch_loss: 33.3602, loss: 24.6334, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9515, LAS: 0.9013, UEM: 0.6730, LEM: 0.4032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1632, partial_loss/deprel_loss: 22.7933, partial_loss/cycle_loss: 0.0000, batch_loss: 18.2673, loss: 23.1488, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8296, UAS: 0.9464, LAS: 0.8957, UEM: 0.6553, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6588, partial_loss/deprel_loss: 54.3492, partial_loss/cycle_loss: 0.0000, batch_loss: 43.8111, loss: 24.7382, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.02it/s]\n",
+      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.155  |    54.349\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.081  |     1.659\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.169  |     0.000\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - UEM                      |     0.622  |     0.655\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - LAS                      |     0.917  |     0.896\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - loss                     |     0.606  |    24.738\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - LEM                      |     0.393  |     0.392\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - UAS                      |     0.956  |     0.946\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - EM                       |     0.955  |     0.830\n",
+      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:00:19,341 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:00:24,554 - INFO - combo.training.trainer - Epoch duration: 0:01:34.171200\n",
+      "2023-04-07 01:00:24,555 - INFO - combo.training.trainer - Estimated training time remaining: 6:53:37\n",
+      "2023-04-07 01:00:24,555 - INFO - allennlp.training.trainer - Epoch 96/399\n",
+      "2023-04-07 01:00:24,555 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:00:24,555 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:00:24,562 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9391, LAS: 0.8974, UEM: 0.2827, LEM: 0.1307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7643, partial_loss/deprel_loss: 0.5785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7848, loss: 0.7524, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||:   4%|3         | 4/111 [00:02<01:00,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9463, LAS: 0.9054, UEM: 0.4872, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7313, partial_loss/deprel_loss: 0.5896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7871, loss: 0.6933, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:   8%|8         | 9/111 [00:04<00:56,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9499, LAS: 0.9104, UEM: 0.5896, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1736, partial_loss/deprel_loss: 0.2812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4288, loss: 0.6497, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  11%|#         | 12/111 [00:07<01:00,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9004, UAS: 0.9503, LAS: 0.9112, UEM: 0.5665, LEM: 0.3555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5769, partial_loss/deprel_loss: 0.5445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7201, loss: 0.6425, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  14%|#4        | 16/111 [00:09<00:55,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9521, LAS: 0.9129, UEM: 0.5732, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4876, partial_loss/deprel_loss: 0.4542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6300, loss: 0.6335, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  17%|#7        | 19/111 [00:11<00:56,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9524, LAS: 0.9133, UEM: 0.5812, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7037, partial_loss/deprel_loss: 0.5797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7736, loss: 0.6279, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  21%|##        | 23/111 [00:13<00:54,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9520, LAS: 0.9131, UEM: 0.5641, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2893, partial_loss/deprel_loss: 0.3722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5247, loss: 0.6309, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  24%|##4       | 27/111 [00:15<00:50,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9548, LAS: 0.9162, UEM: 0.6015, LEM: 0.3720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3965, partial_loss/deprel_loss: 0.4824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6343, loss: 0.6099, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  29%|##8       | 32/111 [00:18<00:43,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9558, LAS: 0.9175, UEM: 0.6238, LEM: 0.3993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7691, partial_loss/deprel_loss: 0.5358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7515, loss: 0.6023, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  33%|###3      | 37/111 [00:20<00:40,  1.84it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9561, LAS: 0.9177, UEM: 0.6109, LEM: 0.3852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2981, partial_loss/deprel_loss: 0.4184, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5634, loss: 0.6028, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  37%|###6      | 41/111 [00:23<00:39,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9546, LAS: 0.9165, UEM: 0.6138, LEM: 0.3904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2492, partial_loss/deprel_loss: 0.3801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5230, loss: 0.6106, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  41%|####      | 45/111 [00:26<00:42,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9550, LAS: 0.9170, UEM: 0.6111, LEM: 0.3871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6034, partial_loss/deprel_loss: 0.4635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6605, loss: 0.6057, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  44%|####4     | 49/111 [00:29<00:39,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9554, LAS: 0.9174, UEM: 0.6144, LEM: 0.3896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4303, partial_loss/deprel_loss: 0.4575, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6211, loss: 0.6032, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  48%|####7     | 53/111 [00:31<00:37,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9550, LAS: 0.9167, UEM: 0.6106, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6086, partial_loss/deprel_loss: 0.5597, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7385, loss: 0.6088, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  51%|#####1    | 57/111 [00:34<00:35,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9552, LAS: 0.9167, UEM: 0.6143, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4830, partial_loss/deprel_loss: 0.5003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6658, loss: 0.6087, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  55%|#####4    | 61/111 [00:37<00:33,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9551, LAS: 0.9167, UEM: 0.6094, LEM: 0.3821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4728, partial_loss/deprel_loss: 0.3934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5782, loss: 0.6072, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  59%|#####8    | 65/111 [00:39<00:29,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9551, LAS: 0.9168, UEM: 0.6119, LEM: 0.3843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1561, partial_loss/deprel_loss: 0.2667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4136, loss: 0.6057, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  62%|######2   | 69/111 [00:42<00:26,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9551, LAS: 0.9169, UEM: 0.6096, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3390, partial_loss/deprel_loss: 0.3907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5493, loss: 0.6053, batch_reg_loss: 0.1689, reg_loss: 0.1691 ||:  66%|######5   | 73/111 [00:44<00:24,  1.54it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9560, LAS: 0.9179, UEM: 0.6290, LEM: 0.4057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2955, partial_loss/deprel_loss: 0.3446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5037, loss: 0.5985, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  69%|######9   | 77/111 [00:47<00:23,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9036, UAS: 0.9564, LAS: 0.9185, UEM: 0.6391, LEM: 0.4171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5531, partial_loss/deprel_loss: 0.4909, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6723, loss: 0.5941, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  72%|#######2  | 80/111 [00:50<00:21,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9565, LAS: 0.9185, UEM: 0.6354, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3544, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5767, loss: 0.5948, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  76%|#######5  | 84/111 [00:52<00:17,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9563, LAS: 0.9183, UEM: 0.6299, LEM: 0.4058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2253, partial_loss/deprel_loss: 0.3211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4708, loss: 0.5979, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  79%|#######9  | 88/111 [00:55<00:15,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9556, LAS: 0.9175, UEM: 0.6254, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5456, partial_loss/deprel_loss: 0.4963, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6750, loss: 0.6032, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  83%|########2 | 92/111 [00:58<00:13,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9555, LAS: 0.9173, UEM: 0.6257, LEM: 0.4025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5814, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7091, loss: 0.6043, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  86%|########6 | 96/111 [01:00<00:09,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9556, LAS: 0.9175, UEM: 0.6248, LEM: 0.4004, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1825, partial_loss/deprel_loss: 0.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4346, loss: 0.6037, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  90%|######### | 100/111 [01:03<00:07,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8807, UAS: 0.9557, LAS: 0.9176, UEM: 0.6292, LEM: 0.4046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9167, partial_loss/deprel_loss: 0.6152, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8444, loss: 0.6018, batch_reg_loss: 0.1688, reg_loss: 0.1690 ||:  94%|#########3| 104/111 [01:06<00:04,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9550, LAS: 0.9170, UEM: 0.6240, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.3029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4594, loss: 0.6050, batch_reg_loss: 0.1688, reg_loss: 0.1690 ||:  97%|#########7| 108/111 [01:08<00:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9550, LAS: 0.9168, UEM: 0.6213, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2427, partial_loss/deprel_loss: 0.4258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5580, loss: 0.6063, batch_reg_loss: 0.1688, reg_loss: 0.1690 ||: 100%|##########| 111/111 [01:10<00:00,  1.57it/s]\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.426  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.243  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.169  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - UEM                      |     0.621  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - LAS                      |     0.917  |       N/A\n",
+      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - loss                     |     0.606  |       N/A\n",
+      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - LEM                      |     0.397  |       N/A\n",
+      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |       N/A\n",
+      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - EM                       |     0.920  |       N/A\n",
+      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:01:38,123 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:01:41,735 - INFO - combo.training.trainer - Epoch duration: 0:01:17.180312\n",
+      "2023-04-07 01:01:41,736 - INFO - combo.training.trainer - Estimated training time remaining: 6:52:02\n",
+      "2023-04-07 01:01:41,736 - INFO - allennlp.training.trainer - Epoch 97/399\n",
+      "2023-04-07 01:01:41,736 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:01:41,737 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:01:41,751 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9212, UAS: 0.9528, LAS: 0.9152, UEM: 0.4238, LEM: 0.1726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.4121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5561, loss: 0.6364, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||:   4%|3         | 4/111 [00:02<01:05,  1.63it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9571, LAS: 0.9196, UEM: 0.4810, LEM: 0.2370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3336, partial_loss/deprel_loss: 0.3597, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5233, loss: 0.5891, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||:   7%|7         | 8/111 [00:04<01:00,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9574, LAS: 0.9207, UEM: 0.5548, LEM: 0.3183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2063, partial_loss/deprel_loss: 0.2908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4427, loss: 0.5791, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||:  12%|#1        | 13/111 [00:06<00:54,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9551, LAS: 0.9179, UEM: 0.5253, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4222, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6018, loss: 0.6009, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||:  16%|#6        | 18/111 [00:09<00:48,  1.91it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9556, LAS: 0.9183, UEM: 0.5201, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5889, partial_loss/deprel_loss: 0.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.5964, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||:  21%|##        | 23/111 [00:11<00:44,  1.99it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9550, LAS: 0.9174, UEM: 0.5125, LEM: 0.2803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6726, partial_loss/deprel_loss: 0.5126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7134, loss: 0.5991, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  24%|##4       | 27/111 [00:14<00:45,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9525, LAS: 0.9149, UEM: 0.5015, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8222, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7814, loss: 0.6175, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  28%|##7       | 31/111 [00:16<00:46,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9539, LAS: 0.9157, UEM: 0.5416, LEM: 0.3111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2850, partial_loss/deprel_loss: 0.3523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5076, loss: 0.6092, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  32%|###1      | 35/111 [00:19<00:47,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9371, UAS: 0.9550, LAS: 0.9171, UEM: 0.5771, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1882, partial_loss/deprel_loss: 0.3070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4520, loss: 0.5997, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  35%|###5      | 39/111 [00:22<00:47,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9541, LAS: 0.9158, UEM: 0.5798, LEM: 0.3571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0605, partial_loss/deprel_loss: 0.7466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9781, loss: 0.6078, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  39%|###8      | 43/111 [00:25<00:47,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9136, UAS: 0.9541, LAS: 0.9158, UEM: 0.5736, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5492, partial_loss/deprel_loss: 0.4876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6686, loss: 0.6089, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  42%|####2     | 47/111 [00:28<00:43,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9544, LAS: 0.9162, UEM: 0.5777, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4814, partial_loss/deprel_loss: 0.5070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6706, loss: 0.6079, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  45%|####5     | 50/111 [00:30<00:42,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9539, LAS: 0.9156, UEM: 0.5682, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3379, partial_loss/deprel_loss: 0.4453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5925, loss: 0.6127, batch_reg_loss: 0.1687, reg_loss: 0.1687 ||:  49%|####8     | 54/111 [00:32<00:38,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9547, LAS: 0.9161, UEM: 0.5806, LEM: 0.3531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4688, partial_loss/deprel_loss: 0.5378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.6084, batch_reg_loss: 0.1687, reg_loss: 0.1687 ||:  52%|#####2    | 58/111 [00:35<00:35,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9558, LAS: 0.9174, UEM: 0.6119, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4793, loss: 0.5991, batch_reg_loss: 0.1687, reg_loss: 0.1687 ||:  56%|#####5    | 62/111 [00:39<00:36,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9561, LAS: 0.9176, UEM: 0.6116, LEM: 0.3917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4259, partial_loss/deprel_loss: 0.5426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.5979, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  59%|#####8    | 65/111 [00:41<00:34,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9558, LAS: 0.9175, UEM: 0.6148, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 0.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6240, loss: 0.5995, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  61%|######1   | 68/111 [00:43<00:32,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9559, LAS: 0.9177, UEM: 0.6136, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1631, partial_loss/deprel_loss: 0.2949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4371, loss: 0.5977, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  64%|######3   | 71/111 [00:45<00:30,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9551, LAS: 0.9166, UEM: 0.6049, LEM: 0.3879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4649, partial_loss/deprel_loss: 0.4780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6440, loss: 0.6042, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  67%|######6   | 74/111 [00:47<00:26,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9549, LAS: 0.9165, UEM: 0.6025, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6400, partial_loss/deprel_loss: 0.5306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7211, loss: 0.6049, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  70%|#######   | 78/111 [00:50<00:23,  1.40it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9559, LAS: 0.9177, UEM: 0.6219, LEM: 0.4045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1427, partial_loss/deprel_loss: 0.2165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3704, loss: 0.5963, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  74%|#######3  | 82/111 [00:53<00:19,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9562, LAS: 0.9179, UEM: 0.6242, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5192, partial_loss/deprel_loss: 0.5186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6873, loss: 0.5945, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  77%|#######6  | 85/111 [00:55<00:17,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9559, LAS: 0.9177, UEM: 0.6176, LEM: 0.3978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4235, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5915, loss: 0.5972, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  80%|########  | 89/111 [00:57<00:14,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9562, LAS: 0.9180, UEM: 0.6208, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1388, partial_loss/deprel_loss: 0.2387, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3873, loss: 0.5943, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  84%|########3 | 93/111 [01:00<00:11,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9562, LAS: 0.9179, UEM: 0.6276, LEM: 0.4098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8061, partial_loss/deprel_loss: 0.5951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8058, loss: 0.5943, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||:  87%|########7 | 97/111 [01:03<00:09,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9561, LAS: 0.9178, UEM: 0.6256, LEM: 0.4068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2770, partial_loss/deprel_loss: 0.3365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4931, loss: 0.5947, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||:  91%|######### | 101/111 [01:06<00:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9560, LAS: 0.9177, UEM: 0.6224, LEM: 0.4029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, partial_loss/deprel_loss: 0.3745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5384, loss: 0.5959, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||:  94%|#########3| 104/111 [01:08<00:04,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9560, LAS: 0.9176, UEM: 0.6200, LEM: 0.3996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3526, partial_loss/deprel_loss: 0.3979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5573, loss: 0.5966, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||:  96%|#########6| 107/111 [01:10<00:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9562, LAS: 0.9178, UEM: 0.6249, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1825, partial_loss/deprel_loss: 0.2514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4061, loss: 0.5948, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||:  99%|#########9| 110/111 [01:12<00:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9563, LAS: 0.9179, UEM: 0.6249, LEM: 0.4038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2849, partial_loss/deprel_loss: 0.3783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5281, loss: 0.5942, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "2023-04-07 01:02:57,808 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.378  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.285  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.169  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - UEM                      |     0.625  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - LAS                      |     0.918  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - loss                     |     0.594  |       N/A\n",
+      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - LEM                      |     0.404  |       N/A\n",
+      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - UAS                      |     0.956  |       N/A\n",
+      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - EM                       |     0.929  |       N/A\n",
+      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:02:57,814 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:03:02,067 - INFO - combo.training.trainer - Epoch duration: 0:01:20.331514\n",
+      "2023-04-07 01:03:02,068 - INFO - combo.training.trainer - Estimated training time remaining: 6:50:36\n",
+      "2023-04-07 01:03:02,068 - INFO - allennlp.training.trainer - Epoch 98/399\n",
+      "2023-04-07 01:03:02,068 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:03:02,069 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:03:02,078 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9541, LAS: 0.9186, UEM: 0.5242, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5159, partial_loss/deprel_loss: 0.5113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6807, loss: 0.6171, batch_reg_loss: 0.1685, reg_loss: 0.1685 ||:   5%|4         | 5/111 [00:02<00:44,  2.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9596, UAS: 0.9624, LAS: 0.9276, UEM: 0.7138, LEM: 0.5187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0722, partial_loss/deprel_loss: 0.1715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3201, loss: 0.5430, batch_reg_loss: 0.1685, reg_loss: 0.1685 ||:   8%|8         | 9/111 [00:04<00:45,  2.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9602, LAS: 0.9251, UEM: 0.6759, LEM: 0.4770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2314, partial_loss/deprel_loss: 0.3308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4794, loss: 0.5607, batch_reg_loss: 0.1685, reg_loss: 0.1685 ||:  12%|#1        | 13/111 [00:06<00:47,  2.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9616, LAS: 0.9257, UEM: 0.6847, LEM: 0.4680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1678, partial_loss/deprel_loss: 0.2828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4282, loss: 0.5542, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||:  14%|#4        | 16/111 [00:08<00:56,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9788, UAS: 0.9625, LAS: 0.9276, UEM: 0.7210, LEM: 0.5319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0258, partial_loss/deprel_loss: 0.0861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2424, loss: 0.5429, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||:  17%|#7        | 19/111 [00:11<01:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9600, LAS: 0.9245, UEM: 0.6866, LEM: 0.4975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7137, partial_loss/deprel_loss: 0.5098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7190, loss: 0.5636, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||:  21%|##        | 23/111 [00:14<00:59,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9593, LAS: 0.9240, UEM: 0.6749, LEM: 0.4812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2493, partial_loss/deprel_loss: 0.3284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4810, loss: 0.5654, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||:  23%|##3       | 26/111 [00:16<00:57,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9578, LAS: 0.9217, UEM: 0.6691, LEM: 0.4742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5636, partial_loss/deprel_loss: 0.5041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6844, loss: 0.5787, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||:  27%|##7       | 30/111 [00:18<00:53,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9563, LAS: 0.9197, UEM: 0.6634, LEM: 0.4649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8823, partial_loss/deprel_loss: 0.6261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8457, loss: 0.5912, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||:  31%|###       | 34/111 [00:21<00:50,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9540, LAS: 0.9172, UEM: 0.6384, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7668, partial_loss/deprel_loss: 0.6458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8384, loss: 0.6081, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||:  34%|###4      | 38/111 [00:23<00:47,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9545, LAS: 0.9177, UEM: 0.6341, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6419, partial_loss/deprel_loss: 0.4970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6943, loss: 0.6035, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||:  38%|###7      | 42/111 [00:26<00:44,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9048, UAS: 0.9552, LAS: 0.9182, UEM: 0.6314, LEM: 0.4292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5426, partial_loss/deprel_loss: 0.5139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6880, loss: 0.5989, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||:  41%|####1     | 46/111 [00:29<00:42,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9548, LAS: 0.9177, UEM: 0.6174, LEM: 0.4134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2994, partial_loss/deprel_loss: 0.4110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5570, loss: 0.6036, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||:  45%|####5     | 50/111 [00:31<00:40,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9551, LAS: 0.9179, UEM: 0.6165, LEM: 0.4088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3775, partial_loss/deprel_loss: 0.3967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5612, loss: 0.6012, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  48%|####7     | 53/111 [00:33<00:38,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9557, LAS: 0.9184, UEM: 0.6215, LEM: 0.4096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2372, partial_loss/deprel_loss: 0.3011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4567, loss: 0.5959, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  50%|#####     | 56/111 [00:35<00:36,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9561, LAS: 0.9188, UEM: 0.6278, LEM: 0.4150, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.2977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4492, loss: 0.5927, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  53%|#####3    | 59/111 [00:38<00:36,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9563, LAS: 0.9188, UEM: 0.6229, LEM: 0.4084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3157, partial_loss/deprel_loss: 0.3908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5441, loss: 0.5923, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  56%|#####5    | 62/111 [00:40<00:34,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9559, LAS: 0.9182, UEM: 0.6228, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2031, partial_loss/deprel_loss: 0.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5095, loss: 0.5966, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  59%|#####8    | 65/111 [00:42<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9560, LAS: 0.9184, UEM: 0.6212, LEM: 0.4057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1784, partial_loss/deprel_loss: 0.2485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4028, loss: 0.5939, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  62%|######2   | 69/111 [00:45<00:29,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9566, LAS: 0.9191, UEM: 0.6341, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1107, partial_loss/deprel_loss: 0.2521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3921, loss: 0.5892, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  65%|######4   | 72/111 [00:47<00:28,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9188, UAS: 0.9566, LAS: 0.9189, UEM: 0.6289, LEM: 0.4104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.4228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5807, loss: 0.5898, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  68%|######8   | 76/111 [00:50<00:24,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9571, LAS: 0.9195, UEM: 0.6385, LEM: 0.4207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2057, partial_loss/deprel_loss: 0.3700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5054, loss: 0.5858, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  71%|#######1  | 79/111 [00:52<00:22,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9571, LAS: 0.9194, UEM: 0.6355, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3003, partial_loss/deprel_loss: 0.4440, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5835, loss: 0.5865, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  74%|#######3  | 82/111 [00:54<00:21,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9572, LAS: 0.9194, UEM: 0.6377, LEM: 0.4172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2213, partial_loss/deprel_loss: 0.3443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4880, loss: 0.5859, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||:  77%|#######6  | 85/111 [00:57<00:19,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9567, LAS: 0.9189, UEM: 0.6401, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1453, partial_loss/deprel_loss: 0.6996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9569, loss: 0.5903, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||:  79%|#######9  | 88/111 [00:59<00:17,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9568, LAS: 0.9189, UEM: 0.6360, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4078, partial_loss/deprel_loss: 0.4475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6078, loss: 0.5904, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||:  82%|########1 | 91/111 [01:01<00:14,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9564, LAS: 0.9184, UEM: 0.6309, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6180, partial_loss/deprel_loss: 0.5235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7107, loss: 0.5933, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||:  86%|########5 | 95/111 [01:03<00:11,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9568, LAS: 0.9188, UEM: 0.6325, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6260, partial_loss/deprel_loss: 0.5665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7466, loss: 0.5919, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||:  89%|########9 | 99/111 [01:06<00:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9567, LAS: 0.9188, UEM: 0.6271, LEM: 0.4056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4285, partial_loss/deprel_loss: 0.4146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5855, loss: 0.5936, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||:  93%|#########2| 103/111 [01:08<00:05,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9573, LAS: 0.9193, UEM: 0.6311, LEM: 0.4069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1397, partial_loss/deprel_loss: 0.2701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4122, loss: 0.5898, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||:  96%|#########6| 107/111 [01:10<00:02,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9572, LAS: 0.9193, UEM: 0.6285, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3200, partial_loss/deprel_loss: 0.4264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5733, loss: 0.5914, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.426  |       N/A\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.320  |       N/A\n",
+      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.168  |       N/A\n",
+      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - UEM                      |     0.628  |       N/A\n",
+      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - LAS                      |     0.919  |       N/A\n",
+      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - loss                     |     0.591  |       N/A\n",
+      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - LEM                      |     0.404  |       N/A\n",
+      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - UAS                      |     0.957  |       N/A\n",
+      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - EM                       |     0.927  |       N/A\n",
+      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:04:18,236 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:04:23,599 - INFO - combo.training.trainer - Epoch duration: 0:01:21.530588\n",
+      "2023-04-07 01:04:23,599 - INFO - combo.training.trainer - Estimated training time remaining: 6:49:15\n",
+      "2023-04-07 01:04:23,599 - INFO - allennlp.training.trainer - Epoch 99/399\n",
+      "2023-04-07 01:04:23,600 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:04:23,600 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:04:23,610 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9617, LAS: 0.9249, UEM: 0.5893, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4106, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5967, loss: 0.5332, batch_reg_loss: 0.1681, reg_loss: 0.1682 ||:   4%|3         | 4/111 [00:02<01:07,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9595, LAS: 0.9213, UEM: 0.6843, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.2754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4223, loss: 0.5445, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:   6%|6         | 7/111 [00:05<01:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9636, LAS: 0.9278, UEM: 0.7559, LEM: 0.5669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4117, partial_loss/deprel_loss: 0.4424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.5165, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:   9%|9         | 10/111 [00:07<01:14,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9641, LAS: 0.9285, UEM: 0.7408, LEM: 0.5375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3300, partial_loss/deprel_loss: 0.3917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5475, loss: 0.5127, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  12%|#1        | 13/111 [00:09<01:13,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9580, LAS: 0.9216, UEM: 0.7034, LEM: 0.4986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6043, partial_loss/deprel_loss: 0.5621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7386, loss: 0.5675, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  15%|#5        | 17/111 [00:12<01:08,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9556, LAS: 0.9192, UEM: 0.6625, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7397, partial_loss/deprel_loss: 0.5515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7573, loss: 0.5879, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  19%|#8        | 21/111 [00:15<01:02,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9563, LAS: 0.9201, UEM: 0.6492, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2487, partial_loss/deprel_loss: 0.3765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5190, loss: 0.5868, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  23%|##2       | 25/111 [00:17<00:57,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9579, LAS: 0.9217, UEM: 0.6643, LEM: 0.4489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1325, partial_loss/deprel_loss: 0.2781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4171, loss: 0.5753, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  26%|##6       | 29/111 [00:19<00:53,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9570, LAS: 0.9207, UEM: 0.6437, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3022, partial_loss/deprel_loss: 0.4089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5556, loss: 0.5883, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  30%|##9       | 33/111 [00:22<00:51,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9567, LAS: 0.9202, UEM: 0.6330, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6738, partial_loss/deprel_loss: 0.5017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7042, loss: 0.5906, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  33%|###3      | 37/111 [00:25<00:48,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9351, UAS: 0.9578, LAS: 0.9212, UEM: 0.6431, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2221, partial_loss/deprel_loss: 0.3180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4669, loss: 0.5836, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  36%|###6      | 40/111 [00:27<00:48,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9584, LAS: 0.9217, UEM: 0.6527, LEM: 0.4313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1170, partial_loss/deprel_loss: 0.2165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3646, loss: 0.5801, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  39%|###8      | 43/111 [00:29<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9586, LAS: 0.9219, UEM: 0.6642, LEM: 0.4476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6093, partial_loss/deprel_loss: 0.5565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7350, loss: 0.5771, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  41%|####1     | 46/111 [00:32<00:47,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9580, LAS: 0.9211, UEM: 0.6541, LEM: 0.4386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3014, partial_loss/deprel_loss: 0.3756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5288, loss: 0.5832, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  45%|####5     | 50/111 [00:34<00:42,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9584, LAS: 0.9217, UEM: 0.6583, LEM: 0.4435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6870, partial_loss/deprel_loss: 0.4964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7025, loss: 0.5790, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  49%|####8     | 54/111 [00:37<00:39,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9592, LAS: 0.9225, UEM: 0.6651, LEM: 0.4454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1660, partial_loss/deprel_loss: 0.2901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4333, loss: 0.5727, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  52%|#####2    | 58/111 [00:39<00:34,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9592, LAS: 0.9223, UEM: 0.6643, LEM: 0.4408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1708, partial_loss/deprel_loss: 0.3220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4597, loss: 0.5735, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  56%|#####5    | 62/111 [00:42<00:33,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9582, LAS: 0.9212, UEM: 0.6523, LEM: 0.4309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7255, partial_loss/deprel_loss: 0.4816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6983, loss: 0.5811, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  59%|#####9    | 66/111 [00:44<00:29,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9577, LAS: 0.9206, UEM: 0.6417, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5670, partial_loss/deprel_loss: 0.5030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6838, loss: 0.5851, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  63%|######3   | 70/111 [00:47<00:26,  1.52it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9571, LAS: 0.9201, UEM: 0.6357, LEM: 0.4142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5721, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6575, loss: 0.5889, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  67%|######6   | 74/111 [00:50<00:25,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9568, LAS: 0.9196, UEM: 0.6329, LEM: 0.4119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2059, partial_loss/deprel_loss: 0.3338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4761, loss: 0.5904, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  69%|######9   | 77/111 [00:53<00:25,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9567, LAS: 0.9194, UEM: 0.6282, LEM: 0.4061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4504, partial_loss/deprel_loss: 0.4251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5981, loss: 0.5918, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  72%|#######2  | 80/111 [00:55<00:22,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9568, LAS: 0.9194, UEM: 0.6270, LEM: 0.4034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2898, partial_loss/deprel_loss: 0.4051, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5499, loss: 0.5915, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  75%|#######4  | 83/111 [00:57<00:20,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9567, LAS: 0.9193, UEM: 0.6383, LEM: 0.4165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1086, partial_loss/deprel_loss: 0.2315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3748, loss: 0.5910, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  77%|#######7  | 86/111 [00:59<00:19,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9568, LAS: 0.9194, UEM: 0.6343, LEM: 0.4114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.3856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5293, loss: 0.5909, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  81%|########1 | 90/111 [01:02<00:14,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9573, LAS: 0.9200, UEM: 0.6318, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3063, partial_loss/deprel_loss: 0.3247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4889, loss: 0.5869, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  86%|########5 | 95/111 [01:04<00:10,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9572, LAS: 0.9199, UEM: 0.6300, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2153, partial_loss/deprel_loss: 0.3539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4941, loss: 0.5871, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  90%|######### | 100/111 [01:06<00:06,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9572, LAS: 0.9199, UEM: 0.6342, LEM: 0.4089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1752, partial_loss/deprel_loss: 0.2231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3814, loss: 0.5868, batch_reg_loss: 0.1678, reg_loss: 0.1680 ||:  95%|#########4| 105/111 [01:09<00:03,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9574, LAS: 0.9199, UEM: 0.6347, LEM: 0.4082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1745, partial_loss/deprel_loss: 0.3159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4555, loss: 0.5861, batch_reg_loss: 0.1678, reg_loss: 0.1680 ||:  98%|#########8| 109/111 [01:12<00:01,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9573, LAS: 0.9198, UEM: 0.6335, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2176, partial_loss/deprel_loss: 0.3469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4889, loss: 0.5870, batch_reg_loss: 0.1678, reg_loss: 0.1680 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "2023-04-07 01:05:40,141 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.347  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.218  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.168  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - UEM                      |     0.633  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - LAS                      |     0.920  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - loss                     |     0.587  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - LEM                      |     0.406  |       N/A\n",
+      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - UAS                      |     0.957  |       N/A\n",
+      "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - EM                       |     0.935  |       N/A\n",
+      "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:05:40,148 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:05:45,118 - INFO - combo.training.trainer - Epoch duration: 0:01:21.518221\n",
+      "2023-04-07 01:05:45,118 - INFO - combo.training.trainer - Estimated training time remaining: 6:47:53\n",
+      "2023-04-07 01:05:45,118 - INFO - allennlp.training.trainer - Epoch 100/399\n",
+      "2023-04-07 01:05:45,119 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:05:45,119 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:05:45,132 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9520, LAS: 0.9132, UEM: 0.6094, LEM: 0.3990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6790, partial_loss/deprel_loss: 0.5050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7076, loss: 0.6213, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||:   4%|3         | 4/111 [00:02<01:06,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9586, LAS: 0.9210, UEM: 0.6494, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4590, partial_loss/deprel_loss: 0.4715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6368, loss: 0.5710, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||:   6%|6         | 7/111 [00:05<01:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9576, LAS: 0.9206, UEM: 0.5918, LEM: 0.3678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4997, partial_loss/deprel_loss: 0.4244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6072, loss: 0.5797, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||:  10%|9         | 11/111 [00:07<01:06,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9606, LAS: 0.9235, UEM: 0.6388, LEM: 0.3973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2654, partial_loss/deprel_loss: 0.3501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5009, loss: 0.5600, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||:  13%|#2        | 14/111 [00:09<01:05,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9619, LAS: 0.9246, UEM: 0.6601, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2255, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5238, loss: 0.5466, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||:  15%|#5        | 17/111 [00:11<01:04,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9631, LAS: 0.9255, UEM: 0.6556, LEM: 0.4027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2328, partial_loss/deprel_loss: 0.3960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5311, loss: 0.5455, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||:  19%|#8        | 21/111 [00:14<00:59,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9625, LAS: 0.9246, UEM: 0.6400, LEM: 0.3836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4028, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.5531, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||:  23%|##2       | 25/111 [00:16<00:56,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9613, LAS: 0.9235, UEM: 0.6279, LEM: 0.3736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2863, partial_loss/deprel_loss: 0.4400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5770, loss: 0.5629, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||:  26%|##6       | 29/111 [00:19<00:52,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9605, LAS: 0.9226, UEM: 0.6154, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2613, partial_loss/deprel_loss: 0.3544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5035, loss: 0.5694, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||:  30%|##9       | 33/111 [00:21<00:50,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9584, LAS: 0.9204, UEM: 0.5967, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0388, partial_loss/deprel_loss: 0.6088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8625, loss: 0.5841, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||:  33%|###3      | 37/111 [00:24<00:47,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9586, LAS: 0.9211, UEM: 0.6047, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3691, partial_loss/deprel_loss: 0.3959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5582, loss: 0.5811, batch_reg_loss: 0.1677, reg_loss: 0.1677 ||:  37%|###6      | 41/111 [00:26<00:44,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9586, LAS: 0.9207, UEM: 0.6054, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2843, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4260, loss: 0.5829, batch_reg_loss: 0.1677, reg_loss: 0.1677 ||:  41%|####      | 45/111 [00:29<00:41,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9592, LAS: 0.9213, UEM: 0.6040, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2283, partial_loss/deprel_loss: 0.3198, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4692, loss: 0.5803, batch_reg_loss: 0.1677, reg_loss: 0.1677 ||:  44%|####4     | 49/111 [00:31<00:38,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9581, LAS: 0.9202, UEM: 0.5987, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2588, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5069, loss: 0.5898, batch_reg_loss: 0.1677, reg_loss: 0.1677 ||:  48%|####7     | 53/111 [00:34<00:36,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9587, LAS: 0.9208, UEM: 0.6148, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2090, partial_loss/deprel_loss: 0.3186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4643, loss: 0.5836, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  51%|#####1    | 57/111 [00:36<00:33,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9587, LAS: 0.9209, UEM: 0.6090, LEM: 0.3644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5263, partial_loss/deprel_loss: 0.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6407, loss: 0.5827, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  55%|#####4    | 61/111 [00:39<00:30,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9588, LAS: 0.9210, UEM: 0.6164, LEM: 0.3774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2336, partial_loss/deprel_loss: 0.3478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4926, loss: 0.5814, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  59%|#####8    | 65/111 [00:42<00:30,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9596, LAS: 0.9221, UEM: 0.6403, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1878, partial_loss/deprel_loss: 0.2835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4319, loss: 0.5750, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  62%|######2   | 69/111 [00:45<00:31,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9595, LAS: 0.9220, UEM: 0.6402, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5404, partial_loss/deprel_loss: 0.5082, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6823, loss: 0.5753, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  65%|######4   | 72/111 [00:47<00:28,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9578, LAS: 0.9204, UEM: 0.6296, LEM: 0.4033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5869, partial_loss/deprel_loss: 0.5256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7055, loss: 0.5868, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  68%|######8   | 76/111 [00:50<00:23,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9583, LAS: 0.9208, UEM: 0.6404, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1843, partial_loss/deprel_loss: 0.3322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4702, loss: 0.5836, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  72%|#######2  | 80/111 [00:52<00:20,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9581, LAS: 0.9206, UEM: 0.6366, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3103, partial_loss/deprel_loss: 0.3814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5347, loss: 0.5845, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  76%|#######5  | 84/111 [00:54<00:16,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9580, LAS: 0.9205, UEM: 0.6320, LEM: 0.4065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7726, partial_loss/deprel_loss: 0.5384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7528, loss: 0.5854, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||:  79%|#######9  | 88/111 [00:59<00:18,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9584, LAS: 0.9209, UEM: 0.6349, LEM: 0.4081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4949, partial_loss/deprel_loss: 0.5901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7386, loss: 0.5834, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||:  83%|########2 | 92/111 [01:01<00:13,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9585, LAS: 0.9210, UEM: 0.6396, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1842, partial_loss/deprel_loss: 0.3661, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.5819, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||:  86%|########6 | 96/111 [01:03<00:10,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9583, LAS: 0.9208, UEM: 0.6358, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4180, partial_loss/deprel_loss: 0.4352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5993, loss: 0.5829, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||:  91%|######### | 101/111 [01:06<00:06,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9589, LAS: 0.9215, UEM: 0.6489, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1436, partial_loss/deprel_loss: 0.2605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4046, loss: 0.5776, batch_reg_loss: 0.1675, reg_loss: 0.1676 ||:  95%|#########4| 105/111 [01:08<00:03,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9582, LAS: 0.9207, UEM: 0.6415, LEM: 0.4139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4188, partial_loss/deprel_loss: 0.4373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6011, loss: 0.5831, batch_reg_loss: 0.1675, reg_loss: 0.1676 ||:  98%|#########8| 109/111 [01:10<00:01,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9578, LAS: 0.9203, UEM: 0.6389, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3320, partial_loss/deprel_loss: 0.4104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5622, loss: 0.5859, batch_reg_loss: 0.1675, reg_loss: 0.1676 ||: 100%|##########| 111/111 [01:11<00:00,  1.55it/s]\n",
+      "2023-04-07 01:07:00,073 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9546, LAS: 0.9047, UEM: 0.6395, LEM: 0.3262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4405, partial_loss/deprel_loss: 24.0473, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3259, loss: 22.2299, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.10it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8763, UAS: 0.9455, LAS: 0.8921, UEM: 0.5202, LEM: 0.2292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9855, partial_loss/deprel_loss: 35.7936, partial_loss/cycle_loss: 0.0000, batch_loss: 28.8320, loss: 23.8770, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9455, LAS: 0.8928, UEM: 0.5466, LEM: 0.2615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3333, partial_loss/deprel_loss: 46.5675, partial_loss/cycle_loss: 0.0000, batch_loss: 37.5207, loss: 25.1771, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.9443, LAS: 0.8922, UEM: 0.5920, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7122, partial_loss/deprel_loss: 54.8760, partial_loss/cycle_loss: 0.0000, batch_loss: 44.2433, loss: 25.7398, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9467, LAS: 0.8962, UEM: 0.6526, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7148, partial_loss/deprel_loss: 33.5731, partial_loss/cycle_loss: 0.0000, batch_loss: 27.0014, loss: 24.9927, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.02it/s]\n",
+      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.410  |    33.573\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.332  |     0.715\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.168  |     0.000\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - UEM                      |     0.639  |     0.653\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - LAS                      |     0.920  |     0.896\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - loss                     |     0.586  |    24.993\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - LEM                      |     0.411  |     0.392\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - UAS                      |     0.958  |     0.947\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - EM                       |     0.922  |     0.888\n",
+      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:07:12,774 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:07:17,870 - INFO - combo.training.trainer - Epoch duration: 0:01:32.751562\n",
+      "2023-04-07 01:07:17,870 - INFO - combo.training.trainer - Estimated training time remaining: 6:47:04\n",
+      "2023-04-07 01:07:17,870 - INFO - allennlp.training.trainer - Epoch 101/399\n",
+      "2023-04-07 01:07:17,871 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:07:17,871 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:07:17,886 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9584, LAS: 0.9224, UEM: 0.5521, LEM: 0.3333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2957, partial_loss/deprel_loss: 0.4164, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5597, loss: 0.5687, batch_reg_loss: 0.1675, reg_loss: 0.1675 ||:   4%|3         | 4/111 [00:02<01:07,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9619, LAS: 0.9268, UEM: 0.5710, LEM: 0.3375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3029, partial_loss/deprel_loss: 0.3438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.5421, batch_reg_loss: 0.1675, reg_loss: 0.1675 ||:   6%|6         | 7/111 [00:04<01:08,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9637, LAS: 0.9273, UEM: 0.6240, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1911, partial_loss/deprel_loss: 0.3880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.5432, batch_reg_loss: 0.1674, reg_loss: 0.1675 ||:  10%|9         | 11/111 [00:07<01:06,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9639, LAS: 0.9273, UEM: 0.6749, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7485, partial_loss/deprel_loss: 0.5903, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7893, loss: 0.5387, batch_reg_loss: 0.1674, reg_loss: 0.1675 ||:  13%|#2        | 14/111 [00:09<01:08,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9642, LAS: 0.9277, UEM: 0.6725, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1768, partial_loss/deprel_loss: 0.3002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4429, loss: 0.5336, batch_reg_loss: 0.1674, reg_loss: 0.1675 ||:  15%|#5        | 17/111 [00:11<01:05,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9644, LAS: 0.9284, UEM: 0.6859, LEM: 0.4493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2393, partial_loss/deprel_loss: 0.3348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4831, loss: 0.5291, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  18%|#8        | 20/111 [00:13<01:03,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9625, LAS: 0.9264, UEM: 0.6755, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8730, partial_loss/deprel_loss: 0.5417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7753, loss: 0.5407, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  22%|##1       | 24/111 [00:16<00:58,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9616, LAS: 0.9251, UEM: 0.6596, LEM: 0.4235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1901, partial_loss/deprel_loss: 0.3190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4606, loss: 0.5484, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  25%|##5       | 28/111 [00:18<00:54,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9613, LAS: 0.9247, UEM: 0.6721, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1284, partial_loss/deprel_loss: 0.2451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3892, loss: 0.5513, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  28%|##7       | 31/111 [00:21<00:55,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9605, LAS: 0.9233, UEM: 0.6628, LEM: 0.4289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3010, partial_loss/deprel_loss: 0.4006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5480, loss: 0.5633, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  32%|###1      | 35/111 [00:23<00:51,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9603, LAS: 0.9233, UEM: 0.6703, LEM: 0.4406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8033, partial_loss/deprel_loss: 0.5819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7936, loss: 0.5633, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  34%|###4      | 38/111 [00:26<00:51,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9592, LAS: 0.9221, UEM: 0.6568, LEM: 0.4260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3455, partial_loss/deprel_loss: 0.4157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5690, loss: 0.5733, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  38%|###7      | 42/111 [00:28<00:46,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9601, LAS: 0.9232, UEM: 0.6750, LEM: 0.4480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2816, partial_loss/deprel_loss: 0.3762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5246, loss: 0.5658, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  41%|####      | 45/111 [00:30<00:47,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9595, LAS: 0.9226, UEM: 0.6701, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1848, partial_loss/deprel_loss: 0.2736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4232, loss: 0.5682, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  43%|####3     | 48/111 [00:33<00:46,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9591, LAS: 0.9219, UEM: 0.6620, LEM: 0.4339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3598, partial_loss/deprel_loss: 0.3840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5465, loss: 0.5704, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  47%|####6     | 52/111 [00:35<00:42,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9588, LAS: 0.9216, UEM: 0.6517, LEM: 0.4234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2664, partial_loss/deprel_loss: 0.3243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4800, loss: 0.5722, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  51%|#####1    | 57/111 [00:38<00:34,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9581, LAS: 0.9209, UEM: 0.6493, LEM: 0.4205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7026, partial_loss/deprel_loss: 0.5731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7663, loss: 0.5773, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  55%|#####4    | 61/111 [00:40<00:30,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9588, LAS: 0.9219, UEM: 0.6482, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1957, partial_loss/deprel_loss: 0.2670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4201, loss: 0.5711, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  59%|#####9    | 66/111 [00:42<00:24,  1.83it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9582, LAS: 0.9211, UEM: 0.6423, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4466, partial_loss/deprel_loss: 0.4426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6107, loss: 0.5769, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  63%|######3   | 70/111 [00:44<00:21,  1.88it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9577, LAS: 0.9206, UEM: 0.6412, LEM: 0.4125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3618, partial_loss/deprel_loss: 0.7365, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0288, loss: 0.5812, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  67%|######6   | 74/111 [00:47<00:21,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9579, LAS: 0.9208, UEM: 0.6425, LEM: 0.4136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1749, partial_loss/deprel_loss: 0.2488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4013, loss: 0.5804, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  70%|#######   | 78/111 [00:49<00:20,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9581, LAS: 0.9210, UEM: 0.6432, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2130, partial_loss/deprel_loss: 0.3557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4944, loss: 0.5795, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  74%|#######3  | 82/111 [00:52<00:18,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9580, LAS: 0.9209, UEM: 0.6464, LEM: 0.4164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1589, partial_loss/deprel_loss: 0.2839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4262, loss: 0.5795, batch_reg_loss: 0.1672, reg_loss: 0.1674 ||:  77%|#######7  | 86/111 [00:55<00:16,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9579, LAS: 0.9210, UEM: 0.6548, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8256, partial_loss/deprel_loss: 0.5331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7588, loss: 0.5791, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  81%|########1 | 90/111 [00:58<00:15,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9581, LAS: 0.9212, UEM: 0.6497, LEM: 0.4266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3404, partial_loss/deprel_loss: 0.3952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5515, loss: 0.5793, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  85%|########4 | 94/111 [01:01<00:11,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9577, LAS: 0.9208, UEM: 0.6408, LEM: 0.4191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4775, partial_loss/deprel_loss: 0.4866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6519, loss: 0.5825, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  88%|########8 | 98/111 [01:04<00:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9580, LAS: 0.9210, UEM: 0.6418, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3033, partial_loss/deprel_loss: 0.3534, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5105, loss: 0.5806, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  92%|#########1| 102/111 [01:06<00:05,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9581, LAS: 0.9211, UEM: 0.6415, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4302, partial_loss/deprel_loss: 0.4356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6017, loss: 0.5786, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  95%|#########5| 106/111 [01:09<00:03,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9576, LAS: 0.9205, UEM: 0.6366, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3003, partial_loss/deprel_loss: 0.4267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5686, loss: 0.5836, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  99%|#########9| 110/111 [01:12<00:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9574, LAS: 0.9204, UEM: 0.6345, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6024, partial_loss/deprel_loss: 0.4961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6845, loss: 0.5845, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
+      "2023-04-07 01:08:33,893 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.496  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.602  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.167  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - UEM                      |     0.635  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - LAS                      |     0.920  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - loss                     |     0.584  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - LEM                      |     0.410  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - UAS                      |     0.957  |       N/A\n",
+      "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - EM                       |     0.908  |       N/A\n",
+      "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:08:33,900 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:08:38,949 - INFO - combo.training.trainer - Epoch duration: 0:01:21.078534\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:08:38,950 - INFO - combo.training.trainer - Estimated training time remaining: 6:45:41\n",
+      "2023-04-07 01:08:38,950 - INFO - allennlp.training.trainer - Epoch 102/399\n",
+      "2023-04-07 01:08:38,950 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:08:38,951 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:08:38,961 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9606, LAS: 0.9211, UEM: 0.6524, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4132, partial_loss/deprel_loss: 0.3944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5653, loss: 0.5691, batch_reg_loss: 0.1672, reg_loss: 0.1672 ||:   4%|3         | 4/111 [00:02<01:05,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9652, LAS: 0.9307, UEM: 0.7796, LEM: 0.6236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2336, partial_loss/deprel_loss: 0.2765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4351, loss: 0.5078, batch_reg_loss: 0.1672, reg_loss: 0.1672 ||:   6%|6         | 7/111 [00:04<01:08,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9618, LAS: 0.9261, UEM: 0.7107, LEM: 0.5336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3021, partial_loss/deprel_loss: 0.3575, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5136, loss: 0.5332, batch_reg_loss: 0.1671, reg_loss: 0.1672 ||:  10%|9         | 11/111 [00:07<01:04,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9556, UAS: 0.9634, LAS: 0.9282, UEM: 0.7425, LEM: 0.5678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0768, partial_loss/deprel_loss: 0.1740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3217, loss: 0.5227, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  13%|#2        | 14/111 [00:09<01:07,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9632, LAS: 0.9276, UEM: 0.7412, LEM: 0.5525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7525, partial_loss/deprel_loss: 0.5876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7877, loss: 0.5288, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  15%|#5        | 17/111 [00:11<01:06,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9589, LAS: 0.9228, UEM: 0.7120, LEM: 0.5238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5075, partial_loss/deprel_loss: 0.7973, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1065, loss: 0.5675, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  18%|#8        | 20/111 [00:13<01:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9608, LAS: 0.9247, UEM: 0.7363, LEM: 0.5412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2577, partial_loss/deprel_loss: 0.3379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4890, loss: 0.5495, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  21%|##        | 23/111 [00:15<01:01,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.9585, LAS: 0.9220, UEM: 0.7148, LEM: 0.5201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8773, partial_loss/deprel_loss: 0.6363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8516, loss: 0.5670, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  24%|##4       | 27/111 [00:18<00:56,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9581, LAS: 0.9220, UEM: 0.7103, LEM: 0.5096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2279, partial_loss/deprel_loss: 0.3713, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5097, loss: 0.5672, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  28%|##7       | 31/111 [00:21<00:53,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9580, LAS: 0.9217, UEM: 0.7005, LEM: 0.4974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2093, partial_loss/deprel_loss: 0.3733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5076, loss: 0.5702, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  31%|###       | 34/111 [00:23<00:53,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9580, LAS: 0.9217, UEM: 0.6965, LEM: 0.4926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.2765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4198, loss: 0.5702, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  33%|###3      | 37/111 [00:25<00:50,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9577, LAS: 0.9215, UEM: 0.6872, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1256, partial_loss/deprel_loss: 0.2269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3737, loss: 0.5715, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  38%|###7      | 42/111 [00:27<00:42,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9560, LAS: 0.9194, UEM: 0.6657, LEM: 0.4646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6179, partial_loss/deprel_loss: 0.6150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7826, loss: 0.5871, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  42%|####2     | 47/111 [00:30<00:37,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9152, UAS: 0.9558, LAS: 0.9192, UEM: 0.6558, LEM: 0.4525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5090, partial_loss/deprel_loss: 0.4367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6182, loss: 0.5894, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  47%|####6     | 52/111 [00:32<00:32,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9564, LAS: 0.9201, UEM: 0.6553, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1447, partial_loss/deprel_loss: 0.2119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3655, loss: 0.5824, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  50%|#####     | 56/111 [00:35<00:32,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9332, UAS: 0.9571, LAS: 0.9206, UEM: 0.6498, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2884, partial_loss/deprel_loss: 0.3945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5403, loss: 0.5802, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  54%|#####4    | 60/111 [00:38<00:32,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9577, LAS: 0.9213, UEM: 0.6562, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0998, partial_loss/deprel_loss: 0.2114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3561, loss: 0.5750, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  58%|#####7    | 64/111 [00:41<00:31,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9585, LAS: 0.9220, UEM: 0.6612, LEM: 0.4481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1420, partial_loss/deprel_loss: 0.3105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4438, loss: 0.5705, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  61%|######1   | 68/111 [00:44<00:30,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9588, LAS: 0.9223, UEM: 0.6601, LEM: 0.4452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4256, partial_loss/deprel_loss: 0.4427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6063, loss: 0.5690, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  64%|######3   | 71/111 [00:46<00:28,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9588, LAS: 0.9222, UEM: 0.6597, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7597, partial_loss/deprel_loss: 0.5197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7346, loss: 0.5689, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  67%|######6   | 74/111 [00:48<00:26,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9592, LAS: 0.9224, UEM: 0.6585, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2314, partial_loss/deprel_loss: 0.3426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4873, loss: 0.5679, batch_reg_loss: 0.1669, reg_loss: 0.1671 ||:  70%|#######   | 78/111 [00:50<00:22,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9587, LAS: 0.9218, UEM: 0.6511, LEM: 0.4325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7663, partial_loss/deprel_loss: 0.5629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7705, loss: 0.5723, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  74%|#######3  | 82/111 [00:53<00:19,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9592, LAS: 0.9222, UEM: 0.6537, LEM: 0.4325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1484, partial_loss/deprel_loss: 0.2987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4355, loss: 0.5698, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  77%|#######7  | 86/111 [00:56<00:16,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9595, LAS: 0.9227, UEM: 0.6553, LEM: 0.4340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1589, partial_loss/deprel_loss: 0.2685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4135, loss: 0.5666, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  80%|########  | 89/111 [00:58<00:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9593, LAS: 0.9226, UEM: 0.6498, LEM: 0.4279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5596, partial_loss/deprel_loss: 0.5026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6809, loss: 0.5676, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  84%|########3 | 93/111 [01:01<00:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9590, LAS: 0.9221, UEM: 0.6420, LEM: 0.4201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4337, partial_loss/deprel_loss: 0.4895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6452, loss: 0.5714, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  87%|########7 | 97/111 [01:04<00:09,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9589, LAS: 0.9219, UEM: 0.6386, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3582, partial_loss/deprel_loss: 0.4022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5602, loss: 0.5725, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  90%|######### | 100/111 [01:06<00:07,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9590, LAS: 0.9220, UEM: 0.6363, LEM: 0.4131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5635, partial_loss/deprel_loss: 0.4484, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6383, loss: 0.5716, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  93%|#########2| 103/111 [01:08<00:05,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9591, LAS: 0.9222, UEM: 0.6381, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2237, partial_loss/deprel_loss: 0.3158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4642, loss: 0.5704, batch_reg_loss: 0.1668, reg_loss: 0.1670 ||:  95%|#########5| 106/111 [01:10<00:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9586, LAS: 0.9217, UEM: 0.6342, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4813, partial_loss/deprel_loss: 0.4999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6630, loss: 0.5739, batch_reg_loss: 0.1668, reg_loss: 0.1670 ||:  99%|#########9| 110/111 [01:13<00:00,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9585, LAS: 0.9215, UEM: 0.6323, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6699, partial_loss/deprel_loss: 0.5022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7025, loss: 0.5751, batch_reg_loss: 0.1668, reg_loss: 0.1670 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.502  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.670  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.167  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - UEM                      |     0.632  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - loss                     |     0.575  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - LEM                      |     0.410  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - UAS                      |     0.958  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - EM                       |     0.903  |       N/A\n",
+      "2023-04-07 01:09:55,425 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:09:55,430 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:09:59,571 - INFO - combo.training.trainer - Epoch duration: 0:01:20.620700\n",
+      "2023-04-07 01:09:59,571 - INFO - combo.training.trainer - Estimated training time remaining: 6:44:16\n",
+      "2023-04-07 01:09:59,571 - INFO - allennlp.training.trainer - Epoch 103/399\n",
+      "2023-04-07 01:09:59,571 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:09:59,572 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:09:59,580 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9667, LAS: 0.9267, UEM: 0.6543, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2148, partial_loss/deprel_loss: 0.3473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4876, loss: 0.5462, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:   4%|3         | 4/111 [00:02<01:16,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9632, LAS: 0.9251, UEM: 0.6317, LEM: 0.3365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1864, partial_loss/deprel_loss: 0.3413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4771, loss: 0.5638, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:   6%|6         | 7/111 [00:04<01:13,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9657, LAS: 0.9289, UEM: 0.7378, LEM: 0.5188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0321, partial_loss/deprel_loss: 0.1224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2712, loss: 0.5427, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:   9%|9         | 10/111 [00:07<01:15,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9589, LAS: 0.9227, UEM: 0.6830, LEM: 0.4771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6950, partial_loss/deprel_loss: 0.5189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7209, loss: 0.5806, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:  13%|#2        | 14/111 [00:10<01:09,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9609, LAS: 0.9240, UEM: 0.6861, LEM: 0.4643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2205, partial_loss/deprel_loss: 0.3790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.5681, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:  15%|#5        | 17/111 [00:12<01:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9623, LAS: 0.9250, UEM: 0.7001, LEM: 0.4740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6032, partial_loss/deprel_loss: 0.4965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6846, loss: 0.5604, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:  18%|#8        | 20/111 [00:14<01:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9602, LAS: 0.9230, UEM: 0.6678, LEM: 0.4394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7369, partial_loss/deprel_loss: 0.4643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6856, loss: 0.5714, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:  22%|##1       | 24/111 [00:16<00:59,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9611, LAS: 0.9240, UEM: 0.6702, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2633, partial_loss/deprel_loss: 0.3939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5345, loss: 0.5612, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:  26%|##6       | 29/111 [00:19<00:51,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9599, LAS: 0.9224, UEM: 0.6433, LEM: 0.4131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3315, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5697, loss: 0.5704, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  31%|###       | 34/111 [00:21<00:44,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9598, LAS: 0.9225, UEM: 0.6343, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2272, partial_loss/deprel_loss: 0.2924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4461, loss: 0.5673, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  35%|###5      | 39/111 [00:23<00:39,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9603, LAS: 0.9230, UEM: 0.6486, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5966, partial_loss/deprel_loss: 0.5535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7288, loss: 0.5641, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  39%|###8      | 43/111 [00:26<00:38,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9583, LAS: 0.9213, UEM: 0.6354, LEM: 0.4107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3198, partial_loss/deprel_loss: 0.3918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5442, loss: 0.5782, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  42%|####2     | 47/111 [00:29<00:39,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9562, LAS: 0.9189, UEM: 0.6229, LEM: 0.4013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9840, partial_loss/deprel_loss: 0.6410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8763, loss: 0.5938, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  46%|####5     | 51/111 [00:31<00:37,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9570, LAS: 0.9198, UEM: 0.6357, LEM: 0.4096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2263, partial_loss/deprel_loss: 0.3587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4989, loss: 0.5857, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  50%|####9     | 55/111 [00:35<00:37,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9578, LAS: 0.9206, UEM: 0.6415, LEM: 0.4125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1857, partial_loss/deprel_loss: 0.3076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.5814, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  53%|#####3    | 59/111 [00:37<00:34,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9581, LAS: 0.9210, UEM: 0.6393, LEM: 0.4106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3038, partial_loss/deprel_loss: 0.3076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4735, loss: 0.5791, batch_reg_loss: 0.1667, reg_loss: 0.1667 ||:  57%|#####6    | 63/111 [00:40<00:33,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9585, LAS: 0.9215, UEM: 0.6440, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4838, partial_loss/deprel_loss: 0.4486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6223, loss: 0.5752, batch_reg_loss: 0.1667, reg_loss: 0.1667 ||:  59%|#####9    | 66/111 [00:43<00:33,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9576, LAS: 0.9204, UEM: 0.6336, LEM: 0.4063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7353, partial_loss/deprel_loss: 0.6104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8020, loss: 0.5839, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  62%|######2   | 69/111 [00:45<00:31,  1.34it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9574, LAS: 0.9203, UEM: 0.6283, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.3712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5206, loss: 0.5847, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  65%|######4   | 72/111 [00:47<00:29,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9574, LAS: 0.9204, UEM: 0.6231, LEM: 0.3956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3128, partial_loss/deprel_loss: 0.3818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5346, loss: 0.5847, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  68%|######7   | 75/111 [00:50<00:27,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9578, LAS: 0.9211, UEM: 0.6336, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4455, partial_loss/deprel_loss: 0.5083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6624, loss: 0.5806, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  70%|#######   | 78/111 [00:52<00:25,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9024, UAS: 0.9577, LAS: 0.9210, UEM: 0.6295, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6275, partial_loss/deprel_loss: 0.5117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7015, loss: 0.5811, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  74%|#######3  | 82/111 [00:55<00:22,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9580, LAS: 0.9213, UEM: 0.6309, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3798, partial_loss/deprel_loss: 0.3906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5551, loss: 0.5784, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  77%|#######7  | 86/111 [00:58<00:18,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9579, LAS: 0.9213, UEM: 0.6258, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5987, partial_loss/deprel_loss: 0.5247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7061, loss: 0.5788, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  81%|########1 | 90/111 [01:00<00:14,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9580, LAS: 0.9214, UEM: 0.6220, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3268, partial_loss/deprel_loss: 0.3844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.5793, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  85%|########4 | 94/111 [01:02<00:11,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9583, LAS: 0.9216, UEM: 0.6287, LEM: 0.3993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1964, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4416, loss: 0.5763, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  88%|########8 | 98/111 [01:05<00:08,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9518, UAS: 0.9591, LAS: 0.9225, UEM: 0.6436, LEM: 0.4152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1200, partial_loss/deprel_loss: 0.2479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3888, loss: 0.5697, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||:  92%|#########1| 102/111 [01:08<00:06,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8799, UAS: 0.9582, LAS: 0.9216, UEM: 0.6361, LEM: 0.4093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8615, partial_loss/deprel_loss: 0.5799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8028, loss: 0.5751, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||:  95%|#########5| 106/111 [01:11<00:03,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9584, LAS: 0.9217, UEM: 0.6389, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5202, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6600, loss: 0.5732, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||:  99%|#########9| 110/111 [01:14<00:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9585, LAS: 0.9218, UEM: 0.6393, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2825, partial_loss/deprel_loss: 0.3588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5101, loss: 0.5726, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||: 100%|##########| 111/111 [01:14<00:00,  1.48it/s]\n",
+      "2023-04-07 01:11:17,321 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.359  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.282  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.167  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - UEM                      |     0.639  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |       N/A\n",
+      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - loss                     |     0.573  |       N/A\n",
+      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - LEM                      |     0.412  |       N/A\n",
+      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
+      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - EM                       |     0.930  |       N/A\n",
+      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:11:17,334 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:11:22,132 - INFO - combo.training.trainer - Epoch duration: 0:01:22.560293\n",
+      "2023-04-07 01:11:22,132 - INFO - combo.training.trainer - Estimated training time remaining: 6:42:57\n",
+      "2023-04-07 01:11:22,132 - INFO - allennlp.training.trainer - Epoch 104/399\n",
+      "2023-04-07 01:11:22,132 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:11:22,133 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:11:22,143 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9579, LAS: 0.9237, UEM: 0.4843, LEM: 0.2304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4918, partial_loss/deprel_loss: 0.4045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5885, loss: 0.5448, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||:   3%|2         | 3/111 [00:02<01:12,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9596, LAS: 0.9227, UEM: 0.5784, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2692, partial_loss/deprel_loss: 0.3732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5189, loss: 0.5343, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||:   5%|5         | 6/111 [00:04<01:12,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9639, LAS: 0.9279, UEM: 0.6773, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4708, partial_loss/deprel_loss: 0.4108, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5893, loss: 0.5089, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||:   8%|8         | 9/111 [00:06<01:10,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9582, LAS: 0.9228, UEM: 0.6431, LEM: 0.4054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8202, partial_loss/deprel_loss: 0.5701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 0.5546, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||:  13%|#2        | 14/111 [00:08<01:01,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9393, UAS: 0.9574, LAS: 0.9219, UEM: 0.6226, LEM: 0.3829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2362, partial_loss/deprel_loss: 0.2969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4512, loss: 0.5644, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||:  17%|#7        | 19/111 [00:11<00:54,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9592, LAS: 0.9236, UEM: 0.6460, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2917, partial_loss/deprel_loss: 0.3613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5138, loss: 0.5537, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||:  22%|##1       | 24/111 [00:13<00:48,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9607, LAS: 0.9253, UEM: 0.6852, LEM: 0.4642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1332, partial_loss/deprel_loss: 0.2207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3697, loss: 0.5380, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||:  25%|##5       | 28/111 [00:16<00:50,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9590, LAS: 0.9238, UEM: 0.6721, LEM: 0.4576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6297, partial_loss/deprel_loss: 0.4486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6512, loss: 0.5475, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||:  29%|##8       | 32/111 [00:19<00:50,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9587, LAS: 0.9229, UEM: 0.6562, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5505, partial_loss/deprel_loss: 0.5524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7184, loss: 0.5561, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||:  32%|###2      | 36/111 [00:21<00:47,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9583, LAS: 0.9225, UEM: 0.6445, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2530, partial_loss/deprel_loss: 0.3163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4700, loss: 0.5594, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||:  36%|###6      | 40/111 [00:24<00:45,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9180, UAS: 0.9579, LAS: 0.9221, UEM: 0.6292, LEM: 0.4080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5182, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6220, loss: 0.5646, batch_reg_loss: 0.1664, reg_loss: 0.1664 ||:  40%|###9      | 44/111 [00:27<00:44,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9591, LAS: 0.9233, UEM: 0.6478, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4055, partial_loss/deprel_loss: 0.4315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.5555, batch_reg_loss: 0.1664, reg_loss: 0.1664 ||:  43%|####3     | 48/111 [00:30<00:43,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9582, LAS: 0.9226, UEM: 0.6473, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6240, partial_loss/deprel_loss: 0.5214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7083, loss: 0.5615, batch_reg_loss: 0.1664, reg_loss: 0.1664 ||:  46%|####5     | 51/111 [00:32<00:44,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9587, LAS: 0.9230, UEM: 0.6452, LEM: 0.4223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2726, partial_loss/deprel_loss: 0.3050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4649, loss: 0.5592, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  49%|####8     | 54/111 [00:35<00:43,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9583, LAS: 0.9225, UEM: 0.6372, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5030, partial_loss/deprel_loss: 0.5071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6726, loss: 0.5631, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  51%|#####1    | 57/111 [00:37<00:40,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9576, LAS: 0.9218, UEM: 0.6313, LEM: 0.4109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8949, partial_loss/deprel_loss: 0.5334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7720, loss: 0.5673, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  54%|#####4    | 60/111 [00:39<00:37,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9583, LAS: 0.9223, UEM: 0.6402, LEM: 0.4173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1827, partial_loss/deprel_loss: 0.2880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4332, loss: 0.5619, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  57%|#####6    | 63/111 [00:41<00:36,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9584, LAS: 0.9225, UEM: 0.6340, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2745, partial_loss/deprel_loss: 0.3362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4901, loss: 0.5619, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  59%|#####9    | 66/111 [00:44<00:33,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9590, LAS: 0.9233, UEM: 0.6448, LEM: 0.4206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0997, partial_loss/deprel_loss: 0.2236, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3651, loss: 0.5570, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  63%|######3   | 70/111 [00:46<00:28,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9587, LAS: 0.9229, UEM: 0.6394, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.4674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6163, loss: 0.5598, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  67%|######6   | 74/111 [00:49<00:25,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9587, LAS: 0.9230, UEM: 0.6390, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8076, partial_loss/deprel_loss: 0.4870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7174, loss: 0.5591, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  70%|#######   | 78/111 [00:51<00:20,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9590, LAS: 0.9232, UEM: 0.6394, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1533, partial_loss/deprel_loss: 0.2899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4288, loss: 0.5578, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  74%|#######3  | 82/111 [00:53<00:18,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9591, LAS: 0.9233, UEM: 0.6367, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4186, partial_loss/deprel_loss: 0.4657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6226, loss: 0.5577, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  77%|#######7  | 86/111 [00:56<00:15,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9588, LAS: 0.9227, UEM: 0.6289, LEM: 0.4028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6325, partial_loss/deprel_loss: 0.5095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7003, loss: 0.5627, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  81%|########1 | 90/111 [00:58<00:13,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9590, LAS: 0.9230, UEM: 0.6330, LEM: 0.4060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1584, partial_loss/deprel_loss: 0.2693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4134, loss: 0.5602, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  85%|########4 | 94/111 [01:01<00:11,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9589, LAS: 0.9227, UEM: 0.6276, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2896, partial_loss/deprel_loss: 0.3616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5134, loss: 0.5627, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  88%|########8 | 98/111 [01:03<00:08,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9581, LAS: 0.9220, UEM: 0.6366, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0334, partial_loss/deprel_loss: 0.1020, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2545, loss: 0.5686, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  92%|#########1| 102/111 [01:06<00:06,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9582, LAS: 0.9220, UEM: 0.6356, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.3612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5294, loss: 0.5684, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  95%|#########5| 106/111 [01:09<00:03,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9585, LAS: 0.9225, UEM: 0.6374, LEM: 0.4164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3568, partial_loss/deprel_loss: 0.3704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5339, loss: 0.5656, batch_reg_loss: 0.1662, reg_loss: 0.1663 ||:  99%|#########9| 110/111 [01:12<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9585, LAS: 0.9225, UEM: 0.6356, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4134, partial_loss/deprel_loss: 0.4592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6162, loss: 0.5660, batch_reg_loss: 0.1662, reg_loss: 0.1663 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
+      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.459  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.413  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.166  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - UEM                      |     0.636  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - loss                     |     0.566  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - LEM                      |     0.415  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - UAS                      |     0.958  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - EM                       |     0.921  |       N/A\n",
+      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:12:38,238 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:12:43,544 - INFO - combo.training.trainer - Epoch duration: 0:01:21.411689\n",
+      "2023-04-07 01:12:43,545 - INFO - combo.training.trainer - Estimated training time remaining: 6:41:35\n",
+      "2023-04-07 01:12:43,545 - INFO - allennlp.training.trainer - Epoch 105/399\n",
+      "2023-04-07 01:12:43,545 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:12:43,546 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:12:43,555 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9605, LAS: 0.9238, UEM: 0.5154, LEM: 0.2423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.4087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.5467, batch_reg_loss: 0.1662, reg_loss: 0.1662 ||:   4%|3         | 4/111 [00:02<00:54,  1.95it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9555, LAS: 0.9193, UEM: 0.4861, LEM: 0.2369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3070, partial_loss/deprel_loss: 0.3412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5006, loss: 0.5761, batch_reg_loss: 0.1662, reg_loss: 0.1662 ||:   7%|7         | 8/111 [00:04<00:55,  1.87it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9566, LAS: 0.9206, UEM: 0.5133, LEM: 0.2719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4960, partial_loss/deprel_loss: 0.4824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6513, loss: 0.5721, batch_reg_loss: 0.1661, reg_loss: 0.1662 ||:  11%|#         | 12/111 [00:06<00:54,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9589, LAS: 0.9236, UEM: 0.5616, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2420, partial_loss/deprel_loss: 0.3775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5165, loss: 0.5580, batch_reg_loss: 0.1661, reg_loss: 0.1662 ||:  14%|#4        | 16/111 [00:09<00:55,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9586, LAS: 0.9240, UEM: 0.5809, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7090, partial_loss/deprel_loss: 0.4814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6930, loss: 0.5559, batch_reg_loss: 0.1661, reg_loss: 0.1662 ||:  18%|#8        | 20/111 [00:11<00:52,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9578, LAS: 0.9217, UEM: 0.5885, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1913, partial_loss/deprel_loss: 0.2940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4395, loss: 0.5726, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||:  22%|##1       | 24/111 [00:13<00:49,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9590, LAS: 0.9226, UEM: 0.5978, LEM: 0.3627, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4385, partial_loss/deprel_loss: 0.5090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6610, loss: 0.5674, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||:  26%|##6       | 29/111 [00:16<00:43,  1.89it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9586, LAS: 0.9223, UEM: 0.5805, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6027, partial_loss/deprel_loss: 0.5682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7412, loss: 0.5714, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||:  30%|##9       | 33/111 [00:18<00:42,  1.84it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9587, LAS: 0.9221, UEM: 0.6065, LEM: 0.3742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2653, partial_loss/deprel_loss: 0.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5404, loss: 0.5698, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||:  33%|###3      | 37/111 [00:21<00:43,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9594, LAS: 0.9225, UEM: 0.6225, LEM: 0.3869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2054, partial_loss/deprel_loss: 0.3136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4580, loss: 0.5648, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||:  37%|###6      | 41/111 [00:24<00:44,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9591, LAS: 0.9220, UEM: 0.6231, LEM: 0.3862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2100, partial_loss/deprel_loss: 0.3562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4930, loss: 0.5681, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  41%|####      | 45/111 [00:26<00:41,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9592, LAS: 0.9222, UEM: 0.6172, LEM: 0.3777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4882, loss: 0.5694, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  44%|####4     | 49/111 [00:29<00:39,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9592, LAS: 0.9220, UEM: 0.6134, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4211, partial_loss/deprel_loss: 0.5321, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.5711, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  48%|####7     | 53/111 [00:32<00:39,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9597, LAS: 0.9228, UEM: 0.6325, LEM: 0.4001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2204, partial_loss/deprel_loss: 0.2532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4126, loss: 0.5662, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  50%|#####     | 56/111 [00:34<00:39,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9752, UAS: 0.9606, LAS: 0.9240, UEM: 0.6598, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0256, partial_loss/deprel_loss: 0.0931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2456, loss: 0.5583, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  53%|#####3    | 59/111 [00:37<00:40,  1.28it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9606, LAS: 0.9239, UEM: 0.6677, LEM: 0.4476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1025, partial_loss/deprel_loss: 0.2338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3735, loss: 0.5582, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  57%|#####6    | 63/111 [00:40<00:37,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9603, LAS: 0.9236, UEM: 0.6652, LEM: 0.4453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5848, partial_loss/deprel_loss: 0.4815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6681, loss: 0.5607, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  59%|#####9    | 66/111 [00:42<00:33,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9604, LAS: 0.9236, UEM: 0.6648, LEM: 0.4440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1711, partial_loss/deprel_loss: 0.2880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4306, loss: 0.5598, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  62%|######2   | 69/111 [00:44<00:31,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9592, LAS: 0.9223, UEM: 0.6538, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0157, partial_loss/deprel_loss: 0.6286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8720, loss: 0.5674, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  66%|######5   | 73/111 [00:47<00:26,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9588, LAS: 0.9219, UEM: 0.6449, LEM: 0.4262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3976, partial_loss/deprel_loss: 0.4270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5871, loss: 0.5712, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||:  69%|######9   | 77/111 [00:49<00:23,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9580, LAS: 0.9211, UEM: 0.6370, LEM: 0.4197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9152, partial_loss/deprel_loss: 0.6189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8441, loss: 0.5799, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||:  72%|#######2  | 80/111 [00:51<00:21,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9576, LAS: 0.9209, UEM: 0.6312, LEM: 0.4145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6424, partial_loss/deprel_loss: 0.4890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6856, loss: 0.5808, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||:  75%|#######4  | 83/111 [00:54<00:19,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9583, LAS: 0.9215, UEM: 0.6427, LEM: 0.4242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1461, partial_loss/deprel_loss: 0.2934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4299, loss: 0.5761, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||:  77%|#######7  | 86/111 [00:56<00:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9589, LAS: 0.9221, UEM: 0.6461, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1714, partial_loss/deprel_loss: 0.3043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.5725, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  81%|########1 | 90/111 [00:58<00:14,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9593, LAS: 0.9225, UEM: 0.6463, LEM: 0.4227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1769, partial_loss/deprel_loss: 0.2699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4172, loss: 0.5698, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  85%|########4 | 94/111 [01:01<00:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9595, LAS: 0.9228, UEM: 0.6455, LEM: 0.4205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2810, partial_loss/deprel_loss: 0.3794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5256, loss: 0.5681, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  88%|########8 | 98/111 [01:03<00:08,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9592, LAS: 0.9224, UEM: 0.6407, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5674, partial_loss/deprel_loss: 0.3946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5951, loss: 0.5697, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  92%|#########1| 102/111 [01:06<00:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9595, LAS: 0.9227, UEM: 0.6432, LEM: 0.4163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4095, loss: 0.5678, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  95%|#########5| 106/111 [01:09<00:03,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9588, LAS: 0.9218, UEM: 0.6365, LEM: 0.4107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3701, partial_loss/deprel_loss: 0.8036, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0827, loss: 0.5747, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  99%|#########9| 110/111 [01:12<00:00,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9586, LAS: 0.9217, UEM: 0.6349, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6125, partial_loss/deprel_loss: 0.5305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 0.5760, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
+      "2023-04-07 01:13:59,528 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9553, LAS: 0.9111, UEM: 0.7989, LEM: 0.6196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1845, partial_loss/deprel_loss: 18.4393, partial_loss/cycle_loss: 0.0000, batch_loss: 14.7883, loss: 19.5219, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.05s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9480, LAS: 0.9002, UEM: 0.6879, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4402, partial_loss/deprel_loss: 23.9572, partial_loss/cycle_loss: 0.0000, batch_loss: 19.2538, loss: 24.4794, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:07,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9532, LAS: 0.9045, UEM: 0.6803, LEM: 0.4123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7114, partial_loss/deprel_loss: 29.0657, partial_loss/cycle_loss: 0.0000, batch_loss: 23.3948, loss: 22.1284, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:07<00:03,  1.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9449, LAS: 0.8945, UEM: 0.6256, LEM: 0.3659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0921, partial_loss/deprel_loss: 41.6153, partial_loss/cycle_loss: 0.0000, batch_loss: 33.5107, loss: 25.4303, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:09<00:00,  1.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9476, LAS: 0.8979, UEM: 0.6576, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1506, partial_loss/deprel_loss: 22.9104, partial_loss/cycle_loss: 0.0000, batch_loss: 18.3585, loss: 24.8863, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:10<00:00,  1.29it/s]\n",
+      "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.530  |    22.910\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.613  |     0.151\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.166  |     0.000\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - UEM                      |     0.635  |     0.658\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |     0.898\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - loss                     |     0.576  |    24.886\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - LEM                      |     0.409  |     0.394\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |     0.948\n",
+      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:14:09,622 - INFO - combo.training.tensorboard_writer - EM                       |     0.905  |     0.939\n",
+      "2023-04-07 01:14:09,622 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:14:09,626 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:14:14,904 - INFO - combo.training.trainer - Epoch duration: 0:01:31.359274\n",
+      "2023-04-07 01:14:14,905 - INFO - combo.training.trainer - Estimated training time remaining: 6:40:40\n",
+      "2023-04-07 01:14:14,905 - INFO - allennlp.training.trainer - Epoch 106/399\n",
+      "2023-04-07 01:14:14,905 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:14:14,906 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:14:14,916 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9597, LAS: 0.9221, UEM: 0.6360, LEM: 0.4109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1200, partial_loss/deprel_loss: 0.2448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3857, loss: 0.5495, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:   4%|3         | 4/111 [00:02<01:11,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9562, LAS: 0.9204, UEM: 0.6661, LEM: 0.4711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6598, partial_loss/deprel_loss: 0.4809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6825, loss: 0.5676, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:   6%|6         | 7/111 [00:04<01:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9575, LAS: 0.9226, UEM: 0.6810, LEM: 0.4839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7804, partial_loss/deprel_loss: 0.6168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8153, loss: 0.5618, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:   9%|9         | 10/111 [00:07<01:10,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9585, LAS: 0.9235, UEM: 0.6787, LEM: 0.4796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1399, partial_loss/deprel_loss: 0.2521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3955, loss: 0.5556, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  12%|#1        | 13/111 [00:09<01:11,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9589, LAS: 0.9241, UEM: 0.6982, LEM: 0.5117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5977, partial_loss/deprel_loss: 0.5713, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7424, loss: 0.5556, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  14%|#4        | 16/111 [00:11<01:08,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9575, LAS: 0.9222, UEM: 0.6738, LEM: 0.4852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6464, partial_loss/deprel_loss: 0.4745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6747, loss: 0.5711, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  17%|#7        | 19/111 [00:13<01:08,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9568, LAS: 0.9216, UEM: 0.6542, LEM: 0.4620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2399, partial_loss/deprel_loss: 0.2948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4496, loss: 0.5771, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  21%|##        | 23/111 [00:16<01:02,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9569, LAS: 0.9217, UEM: 0.6400, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2381, partial_loss/deprel_loss: 0.3725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5114, loss: 0.5755, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  24%|##4       | 27/111 [00:19<00:58,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9582, LAS: 0.9229, UEM: 0.6431, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3158, partial_loss/deprel_loss: 0.3573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.5670, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  28%|##7       | 31/111 [00:21<00:52,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9594, LAS: 0.9240, UEM: 0.6449, LEM: 0.4297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3148, partial_loss/deprel_loss: 0.3962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5457, loss: 0.5601, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  32%|###1      | 35/111 [00:24<00:51,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9591, LAS: 0.9232, UEM: 0.6442, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8498, partial_loss/deprel_loss: 0.6169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8292, loss: 0.5630, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  34%|###4      | 38/111 [00:26<00:49,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9595, LAS: 0.9239, UEM: 0.6561, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7706, partial_loss/deprel_loss: 0.5407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7524, loss: 0.5581, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  37%|###6      | 41/111 [00:28<00:48,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9595, LAS: 0.9238, UEM: 0.6468, LEM: 0.4285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5706, partial_loss/deprel_loss: 0.4615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6490, loss: 0.5583, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  41%|####      | 45/111 [00:31<00:45,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9591, LAS: 0.9235, UEM: 0.6394, LEM: 0.4217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6297, partial_loss/deprel_loss: 0.5389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7228, loss: 0.5618, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  43%|####3     | 48/111 [00:33<00:43,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9593, LAS: 0.9236, UEM: 0.6394, LEM: 0.4189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4952, partial_loss/deprel_loss: 0.4717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6421, loss: 0.5602, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  46%|####5     | 51/111 [00:35<00:42,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9601, LAS: 0.9243, UEM: 0.6537, LEM: 0.4329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1582, partial_loss/deprel_loss: 0.2718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4148, loss: 0.5541, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  49%|####8     | 54/111 [00:38<00:43,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9597, LAS: 0.9237, UEM: 0.6536, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3267, partial_loss/deprel_loss: 0.4067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5564, loss: 0.5575, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  51%|#####1    | 57/111 [00:40<00:40,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9588, LAS: 0.9227, UEM: 0.6441, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5373, partial_loss/deprel_loss: 0.5270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6947, loss: 0.5655, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  54%|#####4    | 60/111 [00:42<00:38,  1.33it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9288, UAS: 0.9592, LAS: 0.9230, UEM: 0.6392, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3362, partial_loss/deprel_loss: 0.4284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5756, loss: 0.5650, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  58%|#####7    | 64/111 [00:44<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9592, LAS: 0.9229, UEM: 0.6352, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4526, loss: 0.5645, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  61%|######1   | 68/111 [00:47<00:28,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9587, LAS: 0.9225, UEM: 0.6254, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5371, partial_loss/deprel_loss: 0.5104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6814, loss: 0.5688, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  65%|######4   | 72/111 [00:49<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9586, LAS: 0.9223, UEM: 0.6207, LEM: 0.3927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5256, partial_loss/deprel_loss: 0.4265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6120, loss: 0.5691, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  68%|######8   | 76/111 [00:52<00:23,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9587, LAS: 0.9223, UEM: 0.6193, LEM: 0.3889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1841, partial_loss/deprel_loss: 0.3153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4547, loss: 0.5685, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  72%|#######2  | 80/111 [00:55<00:22,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9590, LAS: 0.9226, UEM: 0.6208, LEM: 0.3900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2910, partial_loss/deprel_loss: 0.3747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.5656, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  75%|#######4  | 83/111 [00:58<00:20,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9588, LAS: 0.9222, UEM: 0.6164, LEM: 0.3852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5515, partial_loss/deprel_loss: 0.5246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6956, loss: 0.5683, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  77%|#######7  | 86/111 [01:00<00:17,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9583, LAS: 0.9218, UEM: 0.6130, LEM: 0.3822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2468, partial_loss/deprel_loss: 0.3473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4928, loss: 0.5711, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  80%|########  | 89/111 [01:02<00:15,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9588, LAS: 0.9224, UEM: 0.6181, LEM: 0.3849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1722, partial_loss/deprel_loss: 0.2980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4384, loss: 0.5672, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  84%|########3 | 93/111 [01:04<00:12,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9594, LAS: 0.9231, UEM: 0.6311, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0772, partial_loss/deprel_loss: 0.2163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3541, loss: 0.5627, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  88%|########8 | 98/111 [01:07<00:08,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9593, LAS: 0.9232, UEM: 0.6285, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6855, partial_loss/deprel_loss: 0.4708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6793, loss: 0.5622, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  93%|#########2| 103/111 [01:09<00:04,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9589, LAS: 0.9229, UEM: 0.6367, LEM: 0.4134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4590, partial_loss/deprel_loss: 0.4846, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6451, loss: 0.5652, batch_reg_loss: 0.1655, reg_loss: 0.1657 ||:  96%|#########6| 107/111 [01:11<00:02,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9590, LAS: 0.9230, UEM: 0.6388, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6903, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7086, loss: 0.5640, batch_reg_loss: 0.1655, reg_loss: 0.1657 ||: 100%|##########| 111/111 [01:14<00:00,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9590, LAS: 0.9230, UEM: 0.6388, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6903, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7086, loss: 0.5640, batch_reg_loss: 0.1655, reg_loss: 0.1657 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.506  |       N/A\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.690  |       N/A\n",
+      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.166  |       N/A\n",
+      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - UEM                      |     0.639  |       N/A\n",
+      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - LAS                      |     0.923  |       N/A\n",
+      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - loss                     |     0.564  |       N/A\n",
+      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - LEM                      |     0.415  |       N/A\n",
+      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
+      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - EM                       |     0.907  |       N/A\n",
+      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:15:32,914 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:15:37,937 - INFO - combo.training.trainer - Epoch duration: 0:01:23.032082\n",
+      "2023-04-07 01:15:37,938 - INFO - combo.training.trainer - Estimated training time remaining: 6:39:22\n",
+      "2023-04-07 01:15:37,938 - INFO - allennlp.training.trainer - Epoch 107/399\n",
+      "2023-04-07 01:15:37,938 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:15:37,939 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:15:37,951 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9404, LAS: 0.9045, UEM: 0.1818, LEM: 0.0670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6183, partial_loss/deprel_loss: 0.4834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.7128, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9551, LAS: 0.9217, UEM: 0.7477, LEM: 0.6220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2309, partial_loss/deprel_loss: 0.3238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4707, loss: 0.5912, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:   5%|5         | 6/111 [00:04<01:20,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9598, LAS: 0.9264, UEM: 0.7318, LEM: 0.5729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.3944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5294, loss: 0.5564, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:   8%|8         | 9/111 [00:06<01:16,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9556, UAS: 0.9638, LAS: 0.9295, UEM: 0.7680, LEM: 0.5838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0983, partial_loss/deprel_loss: 0.1903, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3374, loss: 0.5257, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  11%|#         | 12/111 [00:09<01:14,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9645, LAS: 0.9301, UEM: 0.7532, LEM: 0.5563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2345, partial_loss/deprel_loss: 0.3621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5021, loss: 0.5165, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  14%|#4        | 16/111 [00:12<01:10,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9611, LAS: 0.9260, UEM: 0.7304, LEM: 0.5306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0098, partial_loss/deprel_loss: 0.6083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8541, loss: 0.5462, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  17%|#7        | 19/111 [00:14<01:07,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9604, LAS: 0.9254, UEM: 0.7239, LEM: 0.5191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9762, partial_loss/deprel_loss: 0.5604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8090, loss: 0.5532, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  20%|#9        | 22/111 [00:16<01:06,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9597, LAS: 0.9250, UEM: 0.7145, LEM: 0.5123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6173, partial_loss/deprel_loss: 0.4916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6822, loss: 0.5542, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  23%|##2       | 25/111 [00:18<01:03,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9588, LAS: 0.9239, UEM: 0.6825, LEM: 0.4837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4539, partial_loss/deprel_loss: 0.4544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.5627, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  26%|##6       | 29/111 [00:21<00:58,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9579, LAS: 0.9230, UEM: 0.6704, LEM: 0.4709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8390, partial_loss/deprel_loss: 0.5060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7380, loss: 0.5715, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  29%|##8       | 32/111 [00:23<00:55,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9584, LAS: 0.9234, UEM: 0.6645, LEM: 0.4611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3485, partial_loss/deprel_loss: 0.3792, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5385, loss: 0.5686, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  32%|###1      | 35/111 [00:25<00:53,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9585, LAS: 0.9232, UEM: 0.6623, LEM: 0.4566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5470, partial_loss/deprel_loss: 0.5001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6749, loss: 0.5675, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  34%|###4      | 38/111 [00:27<00:50,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9595, LAS: 0.9242, UEM: 0.6705, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.3462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4946, loss: 0.5603, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  37%|###6      | 41/111 [00:29<00:49,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9595, LAS: 0.9238, UEM: 0.6617, LEM: 0.4485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6102, partial_loss/deprel_loss: 0.5191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7027, loss: 0.5607, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  41%|####      | 45/111 [00:32<00:44,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9589, LAS: 0.9233, UEM: 0.6512, LEM: 0.4375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2744, partial_loss/deprel_loss: 0.3026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4623, loss: 0.5633, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  44%|####4     | 49/111 [00:34<00:39,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9237, UEM: 0.6471, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3814, partial_loss/deprel_loss: 0.4476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5998, loss: 0.5621, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  48%|####7     | 53/111 [00:36<00:36,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9592, LAS: 0.9237, UEM: 0.6426, LEM: 0.4236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2156, partial_loss/deprel_loss: 0.3679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5028, loss: 0.5612, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  51%|#####1    | 57/111 [00:39<00:34,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9458, UAS: 0.9596, LAS: 0.9240, UEM: 0.6447, LEM: 0.4221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1229, partial_loss/deprel_loss: 0.2915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4231, loss: 0.5587, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  55%|#####4    | 61/111 [00:42<00:32,  1.53it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9597, LAS: 0.9239, UEM: 0.6410, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5022, partial_loss/deprel_loss: 0.4624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6357, loss: 0.5594, batch_reg_loss: 0.1654, reg_loss: 0.1654 ||:  59%|#####8    | 65/111 [00:44<00:29,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9589, LAS: 0.9234, UEM: 0.6424, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1442, partial_loss/deprel_loss: 0.2097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3620, loss: 0.5627, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  62%|######2   | 69/111 [00:47<00:28,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9592, LAS: 0.9236, UEM: 0.6441, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4032, partial_loss/deprel_loss: 0.4486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6049, loss: 0.5617, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  66%|######5   | 73/111 [00:50<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9599, LAS: 0.9243, UEM: 0.6642, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0766, partial_loss/deprel_loss: 0.1825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3266, loss: 0.5553, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  70%|#######   | 78/111 [00:52<00:20,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9604, LAS: 0.9248, UEM: 0.6636, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4480, partial_loss/deprel_loss: 0.4697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6306, loss: 0.5532, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  75%|#######4  | 83/111 [00:54<00:15,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9605, LAS: 0.9249, UEM: 0.6583, LEM: 0.4353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3688, partial_loss/deprel_loss: 0.3764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5402, loss: 0.5531, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  79%|#######9  | 88/111 [00:57<00:12,  1.87it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9603, LAS: 0.9246, UEM: 0.6530, LEM: 0.4290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.4423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5967, loss: 0.5549, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  83%|########2 | 92/111 [00:59<00:10,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9597, LAS: 0.9239, UEM: 0.6455, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6310, partial_loss/deprel_loss: 0.5527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7336, loss: 0.5602, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  86%|########6 | 96/111 [01:02<00:08,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9591, LAS: 0.9233, UEM: 0.6407, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9582, partial_loss/deprel_loss: 0.5912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8299, loss: 0.5646, batch_reg_loss: 0.1652, reg_loss: 0.1654 ||:  90%|######### | 100/111 [01:04<00:06,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9591, LAS: 0.9231, UEM: 0.6373, LEM: 0.4132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2896, partial_loss/deprel_loss: 0.3896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5348, loss: 0.5664, batch_reg_loss: 0.1652, reg_loss: 0.1654 ||:  94%|#########3| 104/111 [01:08<00:04,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9592, LAS: 0.9232, UEM: 0.6353, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3564, partial_loss/deprel_loss: 0.4573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6024, loss: 0.5661, batch_reg_loss: 0.1652, reg_loss: 0.1654 ||:  97%|#########7| 108/111 [01:10<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9596, LAS: 0.9237, UEM: 0.6431, LEM: 0.4185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2550, partial_loss/deprel_loss: 0.3154, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.5627, batch_reg_loss: 0.1652, reg_loss: 0.1654 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.315  |       N/A\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.255  |       N/A\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.165  |       N/A\n",
+      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - UEM                      |     0.643  |       N/A\n",
+      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |       N/A\n",
+      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - loss                     |     0.563  |       N/A\n",
+      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - LEM                      |     0.419  |       N/A\n",
+      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
+      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - EM                       |     0.936  |       N/A\n",
+      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:16:54,114 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:16:59,229 - INFO - combo.training.trainer - Epoch duration: 0:01:21.291164\n",
+      "2023-04-07 01:16:59,230 - INFO - combo.training.trainer - Estimated training time remaining: 6:37:58\n",
+      "2023-04-07 01:16:59,230 - INFO - allennlp.training.trainer - Epoch 108/399\n",
+      "2023-04-07 01:16:59,230 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:16:59,230 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:16:59,239 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9553, LAS: 0.9185, UEM: 0.4522, LEM: 0.2261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2684, partial_loss/deprel_loss: 0.3385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4897, loss: 0.6150, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:   3%|2         | 3/111 [00:02<01:15,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9546, LAS: 0.9193, UEM: 0.4889, LEM: 0.2563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8166, partial_loss/deprel_loss: 0.5060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7334, loss: 0.6051, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:   5%|5         | 6/111 [00:04<01:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9595, LAS: 0.9240, UEM: 0.6025, LEM: 0.3661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1919, partial_loss/deprel_loss: 0.2749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4235, loss: 0.5659, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:   8%|8         | 9/111 [00:06<01:15,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9532, LAS: 0.9178, UEM: 0.5312, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0256, partial_loss/deprel_loss: 0.5718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8277, loss: 0.5976, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  12%|#1        | 13/111 [00:09<01:08,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9536, LAS: 0.9181, UEM: 0.5355, LEM: 0.3208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2057, partial_loss/deprel_loss: 0.2798, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4302, loss: 0.5954, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  14%|#4        | 16/111 [00:11<01:06,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9538, LAS: 0.9180, UEM: 0.5170, LEM: 0.3018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4307, partial_loss/deprel_loss: 0.3894, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5629, loss: 0.5964, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  17%|#7        | 19/111 [00:13<01:04,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9534, LAS: 0.9171, UEM: 0.5024, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5278, partial_loss/deprel_loss: 0.4720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6483, loss: 0.5977, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  20%|#9        | 22/111 [00:15<01:01,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9547, LAS: 0.9183, UEM: 0.5345, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6225, partial_loss/deprel_loss: 0.4262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6306, loss: 0.5869, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  23%|##2       | 25/111 [00:17<01:02,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9568, LAS: 0.9208, UEM: 0.5885, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1603, partial_loss/deprel_loss: 0.2463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3942, loss: 0.5704, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  25%|##5       | 28/111 [00:19<00:59,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9567, LAS: 0.9207, UEM: 0.5925, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6408, partial_loss/deprel_loss: 0.6466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8106, loss: 0.5757, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  28%|##7       | 31/111 [00:22<00:59,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9570, LAS: 0.9211, UEM: 0.5842, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3374, partial_loss/deprel_loss: 0.4541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.5759, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  31%|###       | 34/111 [00:24<00:56,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9571, LAS: 0.9210, UEM: 0.5775, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5832, partial_loss/deprel_loss: 0.5241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7011, loss: 0.5768, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  33%|###3      | 37/111 [00:26<00:53,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9566, LAS: 0.9205, UEM: 0.5616, LEM: 0.3367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5129, partial_loss/deprel_loss: 0.4416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6210, loss: 0.5796, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  37%|###6      | 41/111 [00:29<00:48,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9568, LAS: 0.9208, UEM: 0.5599, LEM: 0.3330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7523, partial_loss/deprel_loss: 0.5404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7479, loss: 0.5798, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  41%|####      | 45/111 [00:31<00:44,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9573, LAS: 0.9212, UEM: 0.5717, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3370, partial_loss/deprel_loss: 0.3491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.5767, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  43%|####3     | 48/111 [00:33<00:43,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9577, LAS: 0.9217, UEM: 0.5806, LEM: 0.3533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.3451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4934, loss: 0.5721, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  46%|####5     | 51/111 [00:35<00:42,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9585, LAS: 0.9226, UEM: 0.6101, LEM: 0.3869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0995, partial_loss/deprel_loss: 0.1774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3269, loss: 0.5642, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  49%|####8     | 54/111 [00:38<00:40,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9580, LAS: 0.9222, UEM: 0.6093, LEM: 0.3867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9579, partial_loss/deprel_loss: 0.6240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8558, loss: 0.5683, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  51%|#####1    | 57/111 [00:40<00:38,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9593, LAS: 0.9234, UEM: 0.6378, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1566, partial_loss/deprel_loss: 0.2924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4303, loss: 0.5589, batch_reg_loss: 0.1651, reg_loss: 0.1651 ||:  55%|#####4    | 61/111 [00:42<00:33,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9597, LAS: 0.9237, UEM: 0.6403, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2546, partial_loss/deprel_loss: 0.2992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4553, loss: 0.5568, batch_reg_loss: 0.1651, reg_loss: 0.1651 ||:  59%|#####8    | 65/111 [00:44<00:28,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9601, LAS: 0.9239, UEM: 0.6396, LEM: 0.4078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2857, partial_loss/deprel_loss: 0.3470, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4998, loss: 0.5548, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  63%|######3   | 70/111 [00:46<00:22,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9602, LAS: 0.9242, UEM: 0.6355, LEM: 0.4028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3710, partial_loss/deprel_loss: 0.3691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5345, loss: 0.5529, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  68%|######7   | 75/111 [00:49<00:19,  1.84it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9609, LAS: 0.9247, UEM: 0.6496, LEM: 0.4167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2679, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4851, loss: 0.5488, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  71%|#######1  | 79/111 [00:51<00:18,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9605, LAS: 0.9245, UEM: 0.6596, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6113, partial_loss/deprel_loss: 0.5152, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6994, loss: 0.5509, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  75%|#######4  | 83/111 [00:55<00:18,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9602, LAS: 0.9244, UEM: 0.6551, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4968, partial_loss/deprel_loss: 0.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5990, loss: 0.5509, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  78%|#######8  | 87/111 [00:58<00:16,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9606, LAS: 0.9248, UEM: 0.6565, LEM: 0.4329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.3940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5639, loss: 0.5483, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  82%|########1 | 91/111 [01:00<00:13,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9600, LAS: 0.9242, UEM: 0.6535, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6841, partial_loss/deprel_loss: 0.4818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6872, loss: 0.5532, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||:  86%|########5 | 95/111 [01:03<00:10,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9598, LAS: 0.9239, UEM: 0.6465, LEM: 0.4221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3786, partial_loss/deprel_loss: 0.4065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5658, loss: 0.5551, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||:  89%|########9 | 99/111 [01:05<00:07,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9596, LAS: 0.9238, UEM: 0.6435, LEM: 0.4186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3555, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5308, loss: 0.5557, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||:  93%|#########2| 103/111 [01:08<00:05,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9041, UAS: 0.9592, LAS: 0.9235, UEM: 0.6426, LEM: 0.4184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8306, partial_loss/deprel_loss: 0.4825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7170, loss: 0.5577, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||:  96%|#########6| 107/111 [01:11<00:02,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9237, UEM: 0.6404, LEM: 0.4160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4690, partial_loss/deprel_loss: 0.4414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.5582, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9237, UEM: 0.6404, LEM: 0.4160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4690, partial_loss/deprel_loss: 0.4414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.5582, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
+      "2023-04-07 01:18:15,970 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.441  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.469  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.165  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - UEM                      |     0.640  |       N/A\n",
+      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |       N/A\n",
+      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - loss                     |     0.558  |       N/A\n",
+      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - LEM                      |     0.416  |       N/A\n",
+      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
+      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - EM                       |     0.922  |       N/A\n",
+      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:18:15,977 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:18:20,504 - INFO - combo.training.trainer - Epoch duration: 0:01:21.274289\n",
+      "2023-04-07 01:18:20,504 - INFO - combo.training.trainer - Estimated training time remaining: 6:36:35\n",
+      "2023-04-07 01:18:20,505 - INFO - allennlp.training.trainer - Epoch 109/399\n",
+      "2023-04-07 01:18:20,505 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:18:20,505 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:18:20,511 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9593, LAS: 0.9236, UEM: 0.6521, LEM: 0.4525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5284, partial_loss/deprel_loss: 0.4916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6639, loss: 0.5311, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||:   3%|2         | 3/111 [00:02<01:20,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9639, LAS: 0.9292, UEM: 0.6776, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0727, partial_loss/deprel_loss: 0.2414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3725, loss: 0.5108, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||:   6%|6         | 7/111 [00:04<01:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9647, LAS: 0.9301, UEM: 0.7206, LEM: 0.5242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5017, partial_loss/deprel_loss: 0.4443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6206, loss: 0.4998, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||:   9%|9         | 10/111 [00:07<01:13,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9639, LAS: 0.9291, UEM: 0.6909, LEM: 0.4869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2603, partial_loss/deprel_loss: 0.3373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4868, loss: 0.5078, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||:  12%|#1        | 13/111 [00:09<01:09,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9650, LAS: 0.9297, UEM: 0.7081, LEM: 0.4977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1774, partial_loss/deprel_loss: 0.3130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4507, loss: 0.5012, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||:  14%|#4        | 16/111 [00:11<01:09,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9652, LAS: 0.9295, UEM: 0.7043, LEM: 0.4836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1694, partial_loss/deprel_loss: 0.2815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4240, loss: 0.5025, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||:  17%|#7        | 19/111 [00:13<01:06,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9654, LAS: 0.9295, UEM: 0.6904, LEM: 0.4650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.3708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5185, loss: 0.5048, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||:  20%|#9        | 22/111 [00:15<01:04,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9639, LAS: 0.9277, UEM: 0.6742, LEM: 0.4469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6014, partial_loss/deprel_loss: 0.5016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6864, loss: 0.5192, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||:  23%|##3       | 26/111 [00:18<00:59,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9629, LAS: 0.9264, UEM: 0.6690, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9460, partial_loss/deprel_loss: 0.6749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8939, loss: 0.5308, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||:  26%|##6       | 29/111 [00:20<00:57,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9615, LAS: 0.9251, UEM: 0.6499, LEM: 0.4218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6377, partial_loss/deprel_loss: 0.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.5409, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||:  29%|##8       | 32/111 [00:22<00:57,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9618, LAS: 0.9255, UEM: 0.6579, LEM: 0.4286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1913, partial_loss/deprel_loss: 0.2937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4380, loss: 0.5392, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||:  32%|###1      | 35/111 [00:24<00:54,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9622, LAS: 0.9256, UEM: 0.6576, LEM: 0.4232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2549, partial_loss/deprel_loss: 0.3702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5119, loss: 0.5392, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||:  35%|###5      | 39/111 [00:27<00:49,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9624, LAS: 0.9262, UEM: 0.6782, LEM: 0.4593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6272, partial_loss/deprel_loss: 0.4519, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6517, loss: 0.5356, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||:  38%|###7      | 42/111 [00:29<00:50,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9618, LAS: 0.9259, UEM: 0.6666, LEM: 0.4473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6933, partial_loss/deprel_loss: 0.4629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6737, loss: 0.5404, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||:  42%|####2     | 47/111 [00:32<00:42,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9612, LAS: 0.9255, UEM: 0.6695, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2173, partial_loss/deprel_loss: 0.2628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4185, loss: 0.5427, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  46%|####5     | 51/111 [00:35<00:40,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9617, LAS: 0.9261, UEM: 0.6680, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2944, partial_loss/deprel_loss: 0.3405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4960, loss: 0.5398, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  50%|####9     | 55/111 [00:37<00:35,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9620, LAS: 0.9264, UEM: 0.6709, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2472, partial_loss/deprel_loss: 0.2889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4453, loss: 0.5356, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  53%|#####3    | 59/111 [00:40<00:34,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9621, LAS: 0.9265, UEM: 0.6713, LEM: 0.4464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3059, partial_loss/deprel_loss: 0.3606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.5340, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  57%|#####6    | 63/111 [00:43<00:32,  1.47it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9622, LAS: 0.9267, UEM: 0.6706, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1655, partial_loss/deprel_loss: 0.2805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4222, loss: 0.5326, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  60%|######    | 67/111 [00:45<00:28,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9617, LAS: 0.9261, UEM: 0.6613, LEM: 0.4347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2136, partial_loss/deprel_loss: 0.3104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4557, loss: 0.5385, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  65%|######4   | 72/111 [00:47<00:23,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9610, LAS: 0.9255, UEM: 0.6554, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6497, partial_loss/deprel_loss: 0.4840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6818, loss: 0.5429, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  68%|######8   | 76/111 [00:50<00:21,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9607, LAS: 0.9252, UEM: 0.6508, LEM: 0.4250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2026, partial_loss/deprel_loss: 0.3609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4939, loss: 0.5461, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  72%|#######2  | 80/111 [00:52<00:18,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9607, LAS: 0.9251, UEM: 0.6457, LEM: 0.4202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2719, partial_loss/deprel_loss: 0.3363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.5473, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  76%|#######5  | 84/111 [00:55<00:16,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8811, UAS: 0.9606, LAS: 0.9251, UEM: 0.6512, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0141, partial_loss/deprel_loss: 0.6056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8519, loss: 0.5472, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9607, LAS: 0.9251, UEM: 0.6511, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2974, partial_loss/deprel_loss: 0.3590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5113, loss: 0.5471, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||:  83%|########2 | 92/111 [01:00<00:12,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9512, UAS: 0.9605, LAS: 0.9250, UEM: 0.6587, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0870, partial_loss/deprel_loss: 0.2240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3612, loss: 0.5474, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||:  86%|########6 | 96/111 [01:03<00:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9600, LAS: 0.9245, UEM: 0.6535, LEM: 0.4318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6137, partial_loss/deprel_loss: 0.4769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6689, loss: 0.5521, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||:  90%|######### | 100/111 [01:06<00:07,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9596, LAS: 0.9239, UEM: 0.6484, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4753, partial_loss/deprel_loss: 0.4882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6502, loss: 0.5571, batch_reg_loss: 0.1646, reg_loss: 0.1647 ||:  94%|#########3| 104/111 [01:08<00:04,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9596, LAS: 0.9239, UEM: 0.6458, LEM: 0.4228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2564, partial_loss/deprel_loss: 0.3385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4867, loss: 0.5568, batch_reg_loss: 0.1646, reg_loss: 0.1647 ||:  97%|#########7| 108/111 [01:11<00:01,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9596, LAS: 0.9238, UEM: 0.6435, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2266, partial_loss/deprel_loss: 0.3723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5078, loss: 0.5579, batch_reg_loss: 0.1646, reg_loss: 0.1647 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.372  |       N/A\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.227  |       N/A\n",
+      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.165  |       N/A\n",
+      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - UEM                      |     0.643  |       N/A\n",
+      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |       N/A\n",
+      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - loss                     |     0.558  |       N/A\n",
+      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - LEM                      |     0.420  |       N/A\n",
+      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
+      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - EM                       |     0.929  |       N/A\n",
+      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:19:36,953 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:19:41,588 - INFO - combo.training.trainer - Epoch duration: 0:01:21.083316\n",
+      "2023-04-07 01:19:41,588 - INFO - combo.training.trainer - Estimated training time remaining: 6:35:12\n",
+      "2023-04-07 01:19:41,589 - INFO - allennlp.training.trainer - Epoch 110/399\n",
+      "2023-04-07 01:19:41,589 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:19:41,589 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:19:41,614 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9717, LAS: 0.9407, UEM: 0.8579, LEM: 0.7503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4825, partial_loss/deprel_loss: 0.4682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6356, loss: 0.4710, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||:   3%|2         | 3/111 [00:02<01:23,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9648, LAS: 0.9312, UEM: 0.7607, LEM: 0.6095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2430, partial_loss/deprel_loss: 0.3122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4630, loss: 0.5286, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||:   5%|5         | 6/111 [00:04<01:19,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9631, LAS: 0.9301, UEM: 0.7603, LEM: 0.6183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5614, partial_loss/deprel_loss: 0.5790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7401, loss: 0.5314, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||:   8%|8         | 9/111 [00:06<01:16,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9626, LAS: 0.9295, UEM: 0.7216, LEM: 0.5597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1972, partial_loss/deprel_loss: 0.3086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4509, loss: 0.5329, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||:  11%|#         | 12/111 [00:08<01:14,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9602, LAS: 0.9259, UEM: 0.6921, LEM: 0.5212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3618, partial_loss/deprel_loss: 0.4305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5813, loss: 0.5588, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||:  14%|#3        | 15/111 [00:10<01:09,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9605, LAS: 0.9263, UEM: 0.6697, LEM: 0.4844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3103, partial_loss/deprel_loss: 0.3685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5214, loss: 0.5584, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||:  17%|#7        | 19/111 [00:13<01:03,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9598, LAS: 0.9255, UEM: 0.6550, LEM: 0.4644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1687, partial_loss/deprel_loss: 0.3197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4541, loss: 0.5648, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||:  20%|#9        | 22/111 [00:15<01:03,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9586, LAS: 0.9242, UEM: 0.6355, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5601, partial_loss/deprel_loss: 0.4628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6468, loss: 0.5702, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||:  23%|##3       | 26/111 [00:18<00:58,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9580, LAS: 0.9236, UEM: 0.6279, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2239, partial_loss/deprel_loss: 0.3454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4856, loss: 0.5715, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  27%|##7       | 30/111 [00:21<00:55,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9576, LAS: 0.9234, UEM: 0.6131, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6178, partial_loss/deprel_loss: 0.5330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7145, loss: 0.5735, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  30%|##9       | 33/111 [00:23<00:55,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9568, LAS: 0.9225, UEM: 0.6158, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2690, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5064, loss: 0.5788, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  32%|###2      | 36/111 [00:25<00:53,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9568, LAS: 0.9225, UEM: 0.6259, LEM: 0.4195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0041, partial_loss/deprel_loss: 0.5339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7924, loss: 0.5774, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  35%|###5      | 39/111 [00:27<00:53,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9555, LAS: 0.9210, UEM: 0.6101, LEM: 0.4044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8748, partial_loss/deprel_loss: 0.6011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8203, loss: 0.5890, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  39%|###8      | 43/111 [00:30<00:48,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9556, LAS: 0.9212, UEM: 0.5979, LEM: 0.3897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5680, partial_loss/deprel_loss: 0.4212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6151, loss: 0.5863, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  43%|####3     | 48/111 [00:32<00:39,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9562, LAS: 0.9215, UEM: 0.6145, LEM: 0.4018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0934, partial_loss/deprel_loss: 0.2977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4213, loss: 0.5821, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  48%|####7     | 53/111 [00:34<00:33,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9565, LAS: 0.9217, UEM: 0.6144, LEM: 0.3993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4778, partial_loss/deprel_loss: 0.4093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5875, loss: 0.5790, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  51%|#####1    | 57/111 [00:36<00:30,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9562, LAS: 0.9214, UEM: 0.6066, LEM: 0.3921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2144, partial_loss/deprel_loss: 0.3356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4758, loss: 0.5818, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  55%|#####4    | 61/111 [00:38<00:27,  1.84it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9565, LAS: 0.9219, UEM: 0.6104, LEM: 0.3969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3077, partial_loss/deprel_loss: 0.3634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5167, loss: 0.5782, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  59%|#####8    | 65/111 [00:42<00:28,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9564, LAS: 0.9217, UEM: 0.6083, LEM: 0.3928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3418, partial_loss/deprel_loss: 0.3516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.5789, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  62%|######2   | 69/111 [00:44<00:26,  1.58it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9572, LAS: 0.9223, UEM: 0.6156, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4749, partial_loss/deprel_loss: 0.4711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6363, loss: 0.5745, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  66%|######5   | 73/111 [00:47<00:25,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9575, LAS: 0.9226, UEM: 0.6203, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1145, partial_loss/deprel_loss: 0.2285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3701, loss: 0.5720, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  69%|######9   | 77/111 [00:50<00:23,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9575, LAS: 0.9225, UEM: 0.6175, LEM: 0.3945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5904, partial_loss/deprel_loss: 0.4982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6810, loss: 0.5731, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  73%|#######2  | 81/111 [00:53<00:21,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9576, LAS: 0.9226, UEM: 0.6186, LEM: 0.3954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3328, partial_loss/deprel_loss: 0.4035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.5720, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  76%|#######5  | 84/111 [00:56<00:19,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9580, LAS: 0.9229, UEM: 0.6180, LEM: 0.3933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3493, partial_loss/deprel_loss: 0.4093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5617, loss: 0.5701, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  78%|#######8  | 87/111 [00:58<00:17,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9583, LAS: 0.9233, UEM: 0.6233, LEM: 0.3994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1383, partial_loss/deprel_loss: 0.2481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3905, loss: 0.5673, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  81%|########1 | 90/111 [01:00<00:15,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9585, LAS: 0.9235, UEM: 0.6321, LEM: 0.4094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6988, partial_loss/deprel_loss: 0.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6720, loss: 0.5650, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  84%|########3 | 93/111 [01:02<00:13,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9585, LAS: 0.9234, UEM: 0.6279, LEM: 0.4046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3920, partial_loss/deprel_loss: 0.4626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6129, loss: 0.5658, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||:  86%|########6 | 96/111 [01:05<00:11,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9586, LAS: 0.9236, UEM: 0.6319, LEM: 0.4104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6267, partial_loss/deprel_loss: 0.4552, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6539, loss: 0.5635, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||:  89%|########9 | 99/111 [01:07<00:08,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9590, LAS: 0.9239, UEM: 0.6369, LEM: 0.4143, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3991, partial_loss/deprel_loss: 0.4368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5936, loss: 0.5613, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||:  92%|#########1| 102/111 [01:09<00:06,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9594, LAS: 0.9242, UEM: 0.6422, LEM: 0.4173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3173, partial_loss/deprel_loss: 0.3599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5157, loss: 0.5582, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||:  95%|#########4| 105/111 [01:12<00:04,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9597, LAS: 0.9245, UEM: 0.6444, LEM: 0.4182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1521, partial_loss/deprel_loss: 0.2242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3741, loss: 0.5558, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||:  97%|#########7| 108/111 [01:14<00:02,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9596, LAS: 0.9243, UEM: 0.6463, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2799, partial_loss/deprel_loss: 0.3418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4937, loss: 0.5562, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||: 100%|##########| 111/111 [01:16<00:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9596, LAS: 0.9243, UEM: 0.6463, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2799, partial_loss/deprel_loss: 0.3418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4937, loss: 0.5562, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
+      "2023-04-07 01:21:01,093 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9641, LAS: 0.9129, UEM: 0.7128, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3735, partial_loss/deprel_loss: 25.4464, partial_loss/cycle_loss: 0.0000, batch_loss: 20.4318, loss: 19.6309, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.04s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9636, LAS: 0.9138, UEM: 0.7601, LEM: 0.4905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1781, partial_loss/deprel_loss: 18.1071, partial_loss/cycle_loss: 0.0000, batch_loss: 14.5213, loss: 19.2017, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:08,  1.02s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8781, UAS: 0.9509, LAS: 0.9007, UEM: 0.7007, LEM: 0.4404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1098, partial_loss/deprel_loss: 41.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 33.2512, loss: 23.2837, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:08<00:05,  1.02s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9466, LAS: 0.8952, UEM: 0.6532, LEM: 0.3988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3394, partial_loss/deprel_loss: 45.8758, partial_loss/cycle_loss: 0.0000, batch_loss: 36.9685, loss: 25.1615, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:10<00:03,  1.01s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9476, LAS: 0.8970, UEM: 0.6576, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8956, partial_loss/deprel_loss: 29.6791, partial_loss/cycle_loss: 0.0000, batch_loss: 23.9224, loss: 24.6363, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9476, LAS: 0.8970, UEM: 0.6576, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8956, partial_loss/deprel_loss: 29.6791, partial_loss/cycle_loss: 0.0000, batch_loss: 23.9224, loss: 24.6363, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
+      "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.342  |    29.679\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.280  |     0.896\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.164  |     0.000\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - UEM                      |     0.646  |     0.658\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |     0.897\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - loss                     |     0.556  |    24.636\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - LEM                      |     0.419  |     0.397\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |     0.948\n",
+      "2023-04-07 01:21:13,723 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:21:13,723 - INFO - combo.training.tensorboard_writer - EM                       |     0.934  |     0.881\n",
+      "2023-04-07 01:21:13,723 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:21:13,728 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:21:18,618 - INFO - combo.training.trainer - Epoch duration: 0:01:37.029658\n",
+      "2023-04-07 01:21:18,619 - INFO - combo.training.trainer - Estimated training time remaining: 6:34:30\n",
+      "2023-04-07 01:21:18,619 - INFO - allennlp.training.trainer - Epoch 111/399\n",
+      "2023-04-07 01:21:18,619 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:21:18,619 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:21:18,627 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9351, UAS: 0.9556, LAS: 0.9218, UEM: 0.4730, LEM: 0.2527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2893, partial_loss/deprel_loss: 0.2881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4526, loss: 0.5829, batch_reg_loss: 0.1643, reg_loss: 0.1643 ||:   4%|3         | 4/111 [00:02<01:09,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9574, LAS: 0.9235, UEM: 0.4780, LEM: 0.2599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3950, partial_loss/deprel_loss: 0.3992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5627, loss: 0.5757, batch_reg_loss: 0.1643, reg_loss: 0.1643 ||:   7%|7         | 8/111 [00:04<01:03,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9598, LAS: 0.9249, UEM: 0.5409, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2755, partial_loss/deprel_loss: 0.3663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.5598, batch_reg_loss: 0.1643, reg_loss: 0.1643 ||:  12%|#1        | 13/111 [00:06<00:55,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9620, LAS: 0.9272, UEM: 0.6094, LEM: 0.3869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1368, partial_loss/deprel_loss: 0.2402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3838, loss: 0.5370, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||:  16%|#6        | 18/111 [00:09<00:48,  1.90it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9626, LAS: 0.9280, UEM: 0.6157, LEM: 0.3911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3550, partial_loss/deprel_loss: 0.3964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5523, loss: 0.5314, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||:  20%|#9        | 22/111 [00:11<00:46,  1.91it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9647, LAS: 0.9304, UEM: 0.6799, LEM: 0.4691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3518, partial_loss/deprel_loss: 0.3935, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5494, loss: 0.5178, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||:  23%|##3       | 26/111 [00:14<00:49,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9639, LAS: 0.9299, UEM: 0.6849, LEM: 0.4770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1500, partial_loss/deprel_loss: 0.2611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4031, loss: 0.5199, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||:  27%|##7       | 30/111 [00:17<00:53,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9635, LAS: 0.9297, UEM: 0.7096, LEM: 0.5093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1431, partial_loss/deprel_loss: 0.2757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4134, loss: 0.5201, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  30%|##9       | 33/111 [00:19<00:54,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9603, LAS: 0.9262, UEM: 0.6885, LEM: 0.4912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6263, partial_loss/deprel_loss: 0.5303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7137, loss: 0.5447, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  33%|###3      | 37/111 [00:22<00:49,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9603, LAS: 0.9262, UEM: 0.6803, LEM: 0.4802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4154, partial_loss/deprel_loss: 0.4471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6050, loss: 0.5469, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  37%|###6      | 41/111 [00:24<00:44,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9592, LAS: 0.9249, UEM: 0.6709, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1996, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4706, loss: 0.5541, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  41%|####      | 45/111 [00:27<00:43,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9580, LAS: 0.9238, UEM: 0.6687, LEM: 0.4696, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8114, partial_loss/deprel_loss: 0.4566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6917, loss: 0.5602, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  44%|####4     | 49/111 [00:30<00:41,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9581, LAS: 0.9238, UEM: 0.6645, LEM: 0.4654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5992, partial_loss/deprel_loss: 0.4125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6140, loss: 0.5593, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  48%|####7     | 53/111 [00:33<00:40,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9589, LAS: 0.9246, UEM: 0.6702, LEM: 0.4658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1928, partial_loss/deprel_loss: 0.3195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4583, loss: 0.5533, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  50%|#####     | 56/111 [00:35<00:40,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9589, LAS: 0.9245, UEM: 0.6632, LEM: 0.4577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5083, partial_loss/deprel_loss: 0.4816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6511, loss: 0.5547, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  53%|#####3    | 59/111 [00:37<00:37,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9591, LAS: 0.9245, UEM: 0.6607, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3761, partial_loss/deprel_loss: 0.4201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5754, loss: 0.5543, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  56%|#####5    | 62/111 [00:39<00:35,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9596, LAS: 0.9248, UEM: 0.6674, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2814, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4760, loss: 0.5503, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  59%|#####8    | 65/111 [00:41<00:33,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9597, LAS: 0.9248, UEM: 0.6682, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1707, partial_loss/deprel_loss: 0.2553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4025, loss: 0.5495, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  61%|######1   | 68/111 [00:44<00:31,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9599, LAS: 0.9250, UEM: 0.6684, LEM: 0.4601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1683, partial_loss/deprel_loss: 0.2533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4004, loss: 0.5474, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  64%|######3   | 71/111 [00:46<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9600, LAS: 0.9251, UEM: 0.6631, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.3692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5171, loss: 0.5473, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  68%|######7   | 75/111 [00:48<00:24,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9592, LAS: 0.9241, UEM: 0.6583, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2128, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4905, loss: 0.5534, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  70%|#######   | 78/111 [00:51<00:23,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9593, LAS: 0.9240, UEM: 0.6555, LEM: 0.4427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4426, partial_loss/deprel_loss: 0.4539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6158, loss: 0.5546, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  73%|#######2  | 81/111 [00:53<00:21,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9593, LAS: 0.9240, UEM: 0.6541, LEM: 0.4401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1507, partial_loss/deprel_loss: 0.2648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4060, loss: 0.5554, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  76%|#######5  | 84/111 [00:55<00:19,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9591, LAS: 0.9238, UEM: 0.6509, LEM: 0.4369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1896, partial_loss/deprel_loss: 0.2569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4075, loss: 0.5566, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  78%|#######8  | 87/111 [00:57<00:17,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9595, LAS: 0.9241, UEM: 0.6525, LEM: 0.4357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2041, partial_loss/deprel_loss: 0.2996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4446, loss: 0.5538, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  81%|########1 | 90/111 [00:59<00:15,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9597, LAS: 0.9243, UEM: 0.6539, LEM: 0.4352, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3412, partial_loss/deprel_loss: 0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5503, loss: 0.5519, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||:  85%|########4 | 94/111 [01:02<00:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9600, LAS: 0.9247, UEM: 0.6560, LEM: 0.4365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2771, partial_loss/deprel_loss: 0.3875, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5294, loss: 0.5495, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||:  87%|########7 | 97/111 [01:04<00:09,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9596, LAS: 0.9243, UEM: 0.6499, LEM: 0.4312, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3014, partial_loss/deprel_loss: 0.3095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4719, loss: 0.5512, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||:  91%|######### | 101/111 [01:09<00:08,  1.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9594, LAS: 0.9240, UEM: 0.6432, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4741, partial_loss/deprel_loss: 0.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6863, loss: 0.5547, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||:  95%|#########4| 105/111 [01:12<00:04,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9597, LAS: 0.9244, UEM: 0.6477, LEM: 0.4275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2616, partial_loss/deprel_loss: 0.3654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5086, loss: 0.5519, batch_reg_loss: 0.1640, reg_loss: 0.1641 ||:  97%|#########7| 108/111 [01:14<00:02,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9595, LAS: 0.9241, UEM: 0.6436, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3721, partial_loss/deprel_loss: 0.3770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5400, loss: 0.5536, batch_reg_loss: 0.1640, reg_loss: 0.1641 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
+      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.377  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.372  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.164  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - UEM                      |     0.644  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - loss                     |     0.554  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - LEM                      |     0.423  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - EM                       |     0.922  |       N/A\n",
+      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:22:38,121 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:22:45,590 - INFO - combo.training.trainer - Epoch duration: 0:01:26.971396\n",
+      "2023-04-07 01:22:45,591 - INFO - combo.training.trainer - Estimated training time remaining: 6:33:21\n",
+      "2023-04-07 01:22:45,591 - INFO - allennlp.training.trainer - Epoch 112/399\n",
+      "2023-04-07 01:22:45,591 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:22:45,592 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:22:45,602 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9465, LAS: 0.9113, UEM: 0.3516, LEM: 0.1868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9347, partial_loss/deprel_loss: 0.5649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8029, loss: 0.6429, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:   3%|2         | 3/111 [00:02<01:18,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9502, LAS: 0.9139, UEM: 0.4979, LEM: 0.3100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7785, partial_loss/deprel_loss: 0.5310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7445, loss: 0.6125, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:   5%|5         | 6/111 [00:04<01:16,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9543, LAS: 0.9171, UEM: 0.5289, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2015, partial_loss/deprel_loss: 0.3542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4876, loss: 0.5984, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:   9%|9         | 10/111 [00:06<01:10,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9520, LAS: 0.9153, UEM: 0.4784, LEM: 0.2608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3941, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5947, loss: 0.6202, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:  13%|#2        | 14/111 [00:09<01:06,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9533, LAS: 0.9172, UEM: 0.5065, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1862, partial_loss/deprel_loss: 0.3066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4465, loss: 0.6082, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:  16%|#6        | 18/111 [00:12<01:03,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8858, UAS: 0.9527, LAS: 0.9165, UEM: 0.5070, LEM: 0.2859, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8457, partial_loss/deprel_loss: 0.5729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7914, loss: 0.6121, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:  19%|#8        | 21/111 [00:14<01:04,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9537, LAS: 0.9181, UEM: 0.5409, LEM: 0.3272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3244, partial_loss/deprel_loss: 0.3309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4936, loss: 0.6005, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  22%|##1       | 24/111 [00:16<01:03,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9403, UAS: 0.9540, LAS: 0.9189, UEM: 0.5440, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3007, partial_loss/deprel_loss: 0.2811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4490, loss: 0.5944, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  24%|##4       | 27/111 [00:19<01:01,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9564, LAS: 0.9210, UEM: 0.5942, LEM: 0.3711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1901, partial_loss/deprel_loss: 0.2766, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4233, loss: 0.5804, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  27%|##7       | 30/111 [00:21<00:58,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9571, LAS: 0.9218, UEM: 0.6062, LEM: 0.3837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4590, partial_loss/deprel_loss: 0.4322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6015, loss: 0.5729, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  30%|##9       | 33/111 [00:23<00:56,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9579, LAS: 0.9227, UEM: 0.6108, LEM: 0.3877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2158, partial_loss/deprel_loss: 0.2707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4236, loss: 0.5635, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  33%|###3      | 37/111 [00:25<00:51,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9576, LAS: 0.9225, UEM: 0.6093, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7147, partial_loss/deprel_loss: 0.4772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6886, loss: 0.5641, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  36%|###6      | 40/111 [00:28<00:52,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9577, LAS: 0.9223, UEM: 0.6054, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2507, partial_loss/deprel_loss: 0.3784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5167, loss: 0.5653, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  39%|###8      | 43/111 [00:30<00:49,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9583, LAS: 0.9233, UEM: 0.6294, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0886, partial_loss/deprel_loss: 0.1720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3192, loss: 0.5584, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||:  41%|####1     | 46/111 [00:32<00:47,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9496, UAS: 0.9586, LAS: 0.9236, UEM: 0.6407, LEM: 0.4244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1205, partial_loss/deprel_loss: 0.1973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3458, loss: 0.5557, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||:  45%|####5     | 50/111 [00:35<00:43,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9588, LAS: 0.9235, UEM: 0.6325, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2406, partial_loss/deprel_loss: 0.3505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4924, loss: 0.5578, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||:  49%|####8     | 54/111 [00:37<00:38,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9588, LAS: 0.9236, UEM: 0.6321, LEM: 0.4144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1250, partial_loss/deprel_loss: 0.2503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3891, loss: 0.5572, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||:  51%|#####1    | 57/111 [00:39<00:36,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9582, LAS: 0.9231, UEM: 0.6267, LEM: 0.4089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2787, partial_loss/deprel_loss: 0.2862, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4485, loss: 0.5608, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  55%|#####4    | 61/111 [00:42<00:33,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9581, LAS: 0.9230, UEM: 0.6202, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4928, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5998, loss: 0.5626, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  59%|#####8    | 65/111 [00:45<00:30,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9577, LAS: 0.9226, UEM: 0.6181, LEM: 0.3990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.3742, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5312, loss: 0.5654, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  61%|######1   | 68/111 [00:47<00:29,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9583, LAS: 0.9231, UEM: 0.6201, LEM: 0.3982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3537, partial_loss/deprel_loss: 0.4052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5587, loss: 0.5631, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  64%|######3   | 71/111 [00:49<00:27,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9581, LAS: 0.9230, UEM: 0.6127, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4975, partial_loss/deprel_loss: 0.4292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6067, loss: 0.5656, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  67%|######6   | 74/111 [00:51<00:26,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9437, UAS: 0.9583, LAS: 0.9234, UEM: 0.6134, LEM: 0.3913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2865, partial_loss/deprel_loss: 0.3171, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4748, loss: 0.5631, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  70%|#######   | 78/111 [00:54<00:22,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9589, LAS: 0.9240, UEM: 0.6244, LEM: 0.4020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1680, partial_loss/deprel_loss: 0.2197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3732, loss: 0.5580, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  73%|#######2  | 81/111 [00:56<00:20,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9588, LAS: 0.9238, UEM: 0.6206, LEM: 0.3978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2257, partial_loss/deprel_loss: 0.2934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.5580, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  77%|#######6  | 85/111 [00:59<00:18,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9595, LAS: 0.9246, UEM: 0.6336, LEM: 0.4103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2709, partial_loss/deprel_loss: 0.3525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4999, loss: 0.5523, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  80%|########  | 89/111 [01:01<00:14,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9602, LAS: 0.9254, UEM: 0.6529, LEM: 0.4353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1587, partial_loss/deprel_loss: 0.2924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4294, loss: 0.5475, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  84%|########3 | 93/111 [01:05<00:13,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9599, LAS: 0.9252, UEM: 0.6513, LEM: 0.4335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1936, partial_loss/deprel_loss: 0.2764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4236, loss: 0.5494, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  86%|########6 | 96/111 [01:07<00:10,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9597, LAS: 0.9249, UEM: 0.6490, LEM: 0.4296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2162, partial_loss/deprel_loss: 0.3828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5132, loss: 0.5507, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||:  90%|######### | 100/111 [01:09<00:07,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9595, LAS: 0.9246, UEM: 0.6438, LEM: 0.4233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2196, partial_loss/deprel_loss: 0.3284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4704, loss: 0.5532, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||:  95%|#########4| 105/111 [01:11<00:03,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9597, LAS: 0.9248, UEM: 0.6440, LEM: 0.4238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.3587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5283, loss: 0.5515, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||:  99%|#########9| 110/111 [01:13<00:00,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9597, LAS: 0.9249, UEM: 0.6435, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2821, partial_loss/deprel_loss: 0.3450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4962, loss: 0.5510, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
+      "2023-04-07 01:24:02,965 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.345  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.282  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.164  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - UEM                      |     0.644  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - LAS                      |     0.925  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - loss                     |     0.551  |       N/A\n",
+      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - LEM                      |     0.423  |       N/A\n",
+      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
+      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - EM                       |     0.931  |       N/A\n",
+      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:24:02,972 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:24:08,115 - INFO - combo.training.trainer - Epoch duration: 0:01:22.524054\n",
+      "2023-04-07 01:24:08,116 - INFO - combo.training.trainer - Estimated training time remaining: 6:32:00\n",
+      "2023-04-07 01:24:08,116 - INFO - allennlp.training.trainer - Epoch 113/399\n",
+      "2023-04-07 01:24:08,119 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:24:08,120 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:24:08,127 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9435, LAS: 0.9077, UEM: 0.5920, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1878, partial_loss/deprel_loss: 0.2747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4211, loss: 0.6665, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:   3%|2         | 3/111 [00:02<01:18,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9525, LAS: 0.9181, UEM: 0.6117, LEM: 0.3944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3329, partial_loss/deprel_loss: 0.3963, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5473, loss: 0.5999, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:   5%|5         | 6/111 [00:04<01:14,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9566, LAS: 0.9209, UEM: 0.6403, LEM: 0.4142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1369, partial_loss/deprel_loss: 0.2747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4108, loss: 0.5777, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:   8%|8         | 9/111 [00:06<01:12,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9572, UAS: 0.9597, LAS: 0.9256, UEM: 0.6848, LEM: 0.4760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0767, partial_loss/deprel_loss: 0.1787, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3220, loss: 0.5496, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:  11%|#         | 12/111 [00:08<01:11,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9600, LAS: 0.9256, UEM: 0.6684, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5117, partial_loss/deprel_loss: 0.4077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5922, loss: 0.5426, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:  14%|#3        | 15/111 [00:10<01:08,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9572, LAS: 0.9225, UEM: 0.6189, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6246, partial_loss/deprel_loss: 0.5487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7275, loss: 0.5690, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:  17%|#7        | 19/111 [00:13<01:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9574, LAS: 0.9231, UEM: 0.6233, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1474, partial_loss/deprel_loss: 0.2087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3601, loss: 0.5615, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:  21%|##        | 23/111 [00:15<00:57,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8803, UAS: 0.9573, LAS: 0.9233, UEM: 0.6406, LEM: 0.4323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0529, partial_loss/deprel_loss: 0.5422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8079, loss: 0.5586, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  24%|##4       | 27/111 [00:18<00:54,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9564, LAS: 0.9221, UEM: 0.6399, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1533, partial_loss/deprel_loss: 0.2707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4108, loss: 0.5640, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  27%|##7       | 30/111 [00:20<00:54,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9571, LAS: 0.9223, UEM: 0.6434, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1653, partial_loss/deprel_loss: 0.2758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4173, loss: 0.5608, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  30%|##9       | 33/111 [00:22<00:52,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9564, LAS: 0.9217, UEM: 0.6241, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6261, partial_loss/deprel_loss: 0.4662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.5668, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  32%|###2      | 36/111 [00:24<00:51,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9566, LAS: 0.9218, UEM: 0.6162, LEM: 0.4052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3270, partial_loss/deprel_loss: 0.3358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4977, loss: 0.5653, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  35%|###5      | 39/111 [00:26<00:50,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9567, LAS: 0.9220, UEM: 0.6088, LEM: 0.3970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6791, partial_loss/deprel_loss: 0.4889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6906, loss: 0.5671, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  38%|###7      | 42/111 [00:28<00:49,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9564, LAS: 0.9216, UEM: 0.6039, LEM: 0.3907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1989, partial_loss/deprel_loss: 0.2975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4414, loss: 0.5713, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  41%|####1     | 46/111 [00:31<00:45,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9572, LAS: 0.9224, UEM: 0.6089, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5235, partial_loss/deprel_loss: 0.4346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6160, loss: 0.5652, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  45%|####5     | 50/111 [00:34<00:42,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9569, LAS: 0.9224, UEM: 0.6093, LEM: 0.3951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7306, partial_loss/deprel_loss: 0.5466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7470, loss: 0.5666, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||:  49%|####8     | 54/111 [00:36<00:38,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9574, LAS: 0.9229, UEM: 0.6208, LEM: 0.4067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6226, partial_loss/deprel_loss: 0.4704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6644, loss: 0.5625, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9579, LAS: 0.9234, UEM: 0.6257, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3557, partial_loss/deprel_loss: 0.4244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5743, loss: 0.5590, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9586, LAS: 0.9242, UEM: 0.6372, LEM: 0.4214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3923, loss: 0.5533, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||:  57%|#####6    | 63/111 [00:43<00:36,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9583, LAS: 0.9240, UEM: 0.6283, LEM: 0.4121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3313, partial_loss/deprel_loss: 0.3747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5295, loss: 0.5554, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  60%|######    | 67/111 [00:46<00:31,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9595, LAS: 0.9252, UEM: 0.6533, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1309, partial_loss/deprel_loss: 0.2326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3758, loss: 0.5470, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  63%|######3   | 70/111 [00:48<00:28,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9599, LAS: 0.9257, UEM: 0.6554, LEM: 0.4405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1910, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4856, loss: 0.5443, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  66%|######5   | 73/111 [00:50<00:28,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9596, LAS: 0.9254, UEM: 0.6500, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3578, partial_loss/deprel_loss: 0.3686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5300, loss: 0.5468, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  69%|######9   | 77/111 [00:53<00:24,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9601, LAS: 0.9257, UEM: 0.6518, LEM: 0.4329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1751, partial_loss/deprel_loss: 0.2854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.5443, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  73%|#######2  | 81/111 [00:55<00:19,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9595, LAS: 0.9250, UEM: 0.6442, LEM: 0.4260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8791, partial_loss/deprel_loss: 0.5936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8142, loss: 0.5483, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  77%|#######7  | 86/111 [00:57<00:14,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9598, LAS: 0.9254, UEM: 0.6547, LEM: 0.4429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5151, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6146, loss: 0.5463, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  81%|########1 | 90/111 [01:00<00:13,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9604, LAS: 0.9259, UEM: 0.6577, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2140, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5053, loss: 0.5433, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  85%|########4 | 94/111 [01:02<00:10,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9602, LAS: 0.9256, UEM: 0.6506, LEM: 0.4359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4410, partial_loss/deprel_loss: 0.4332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5982, loss: 0.5457, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||:  88%|########8 | 98/111 [01:05<00:07,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9604, LAS: 0.9258, UEM: 0.6540, LEM: 0.4368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3462, partial_loss/deprel_loss: 0.3633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5233, loss: 0.5434, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||:  92%|#########1| 102/111 [01:07<00:05,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9605, LAS: 0.9260, UEM: 0.6514, LEM: 0.4324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3090, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4792, loss: 0.5419, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||:  96%|#########6| 107/111 [01:10<00:02,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9601, LAS: 0.9256, UEM: 0.6451, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4750, partial_loss/deprel_loss: 0.4599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6263, loss: 0.5441, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||: 100%|##########| 111/111 [01:12<00:00,  1.54it/s]\n",
+      "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.460  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.475  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.164  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - UEM                      |     0.645  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - LAS                      |     0.926  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - loss                     |     0.544  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - LEM                      |     0.427  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - EM                       |     0.915  |       N/A\n",
+      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:25:23,472 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:25:28,456 - INFO - combo.training.trainer - Epoch duration: 0:01:20.340225\n",
+      "2023-04-07 01:25:28,456 - INFO - combo.training.trainer - Estimated training time remaining: 6:30:34\n",
+      "2023-04-07 01:25:28,457 - INFO - allennlp.training.trainer - Epoch 114/399\n",
+      "2023-04-07 01:25:28,457 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:25:28,457 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:25:28,466 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9547, LAS: 0.9186, UEM: 0.4273, LEM: 0.1939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6578, partial_loss/deprel_loss: 0.4807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6796, loss: 0.6056, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||:   3%|2         | 3/111 [00:02<01:21,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9578, LAS: 0.9234, UEM: 0.4774, LEM: 0.2359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.3978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.5772, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||:   5%|5         | 6/111 [00:04<01:18,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9633, LAS: 0.9302, UEM: 0.5858, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2834, partial_loss/deprel_loss: 0.3211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.5286, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||:   9%|9         | 10/111 [00:06<01:11,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9626, LAS: 0.9286, UEM: 0.6194, LEM: 0.3824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5775, partial_loss/deprel_loss: 0.5050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6829, loss: 0.5309, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||:  13%|#2        | 14/111 [00:09<01:05,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9637, LAS: 0.9305, UEM: 0.6935, LEM: 0.4949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2059, partial_loss/deprel_loss: 0.3146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4562, loss: 0.5180, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||:  15%|#5        | 17/111 [00:11<01:08,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9644, LAS: 0.9308, UEM: 0.6832, LEM: 0.4742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3690, partial_loss/deprel_loss: 0.4402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5893, loss: 0.5159, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  19%|#8        | 21/111 [00:14<01:02,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9633, LAS: 0.9294, UEM: 0.6628, LEM: 0.4527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6813, partial_loss/deprel_loss: 0.5702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7558, loss: 0.5264, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  22%|##1       | 24/111 [00:16<01:00,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9644, LAS: 0.9303, UEM: 0.6832, LEM: 0.4702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0925, partial_loss/deprel_loss: 0.2237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3608, loss: 0.5173, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  24%|##4       | 27/111 [00:18<00:58,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9624, LAS: 0.9282, UEM: 0.6623, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4599, partial_loss/deprel_loss: 0.4563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6204, loss: 0.5314, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  27%|##7       | 30/111 [00:20<00:56,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9620, LAS: 0.9284, UEM: 0.6473, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.4161, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6197, loss: 0.5333, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  31%|###       | 34/111 [00:23<00:51,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9632, LAS: 0.9297, UEM: 0.6585, LEM: 0.4422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3120, partial_loss/deprel_loss: 0.3296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4894, loss: 0.5242, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  34%|###4      | 38/111 [00:25<00:48,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9624, LAS: 0.9289, UEM: 0.6467, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2178, partial_loss/deprel_loss: 0.2864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4360, loss: 0.5306, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||:  38%|###7      | 42/111 [00:28<00:46,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9616, LAS: 0.9279, UEM: 0.6359, LEM: 0.4228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7707, partial_loss/deprel_loss: 0.5840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7846, loss: 0.5386, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||:  41%|####      | 45/111 [00:30<00:47,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9620, LAS: 0.9282, UEM: 0.6325, LEM: 0.4168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2114, partial_loss/deprel_loss: 0.2645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4172, loss: 0.5358, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||:  43%|####3     | 48/111 [00:33<00:45,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9617, LAS: 0.9280, UEM: 0.6243, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3437, partial_loss/deprel_loss: 0.3858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5407, loss: 0.5381, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||:  46%|####5     | 51/111 [00:35<00:44,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9617, LAS: 0.9280, UEM: 0.6325, LEM: 0.4184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3666, partial_loss/deprel_loss: 0.3718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5340, loss: 0.5358, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  49%|####8     | 54/111 [00:37<00:41,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9615, LAS: 0.9277, UEM: 0.6346, LEM: 0.4193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9003, partial_loss/deprel_loss: 0.5767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8046, loss: 0.5368, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  51%|#####1    | 57/111 [00:39<00:39,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9606, LAS: 0.9267, UEM: 0.6277, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0115, partial_loss/deprel_loss: 0.6611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8944, loss: 0.5447, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  54%|#####4    | 60/111 [00:42<00:37,  1.35it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9609, LAS: 0.9269, UEM: 0.6307, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4027, partial_loss/deprel_loss: 0.4277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.5431, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  57%|#####6    | 63/111 [00:44<00:36,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9607, LAS: 0.9267, UEM: 0.6229, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2619, partial_loss/deprel_loss: 0.3418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4891, loss: 0.5432, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  60%|######    | 67/111 [00:46<00:31,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9613, LAS: 0.9271, UEM: 0.6294, LEM: 0.4077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1762, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4539, loss: 0.5403, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  63%|######3   | 70/111 [00:49<00:29,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9609, LAS: 0.9267, UEM: 0.6307, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3327, partial_loss/deprel_loss: 0.3712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.5436, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  66%|######5   | 73/111 [00:51<00:26,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9613, LAS: 0.9272, UEM: 0.6381, LEM: 0.4157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2478, partial_loss/deprel_loss: 0.3511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4936, loss: 0.5398, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  68%|######8   | 76/111 [00:53<00:24,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9614, LAS: 0.9272, UEM: 0.6402, LEM: 0.4171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4677, partial_loss/deprel_loss: 0.4691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6320, loss: 0.5406, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  72%|#######2  | 80/111 [00:55<00:20,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9616, LAS: 0.9273, UEM: 0.6387, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1989, partial_loss/deprel_loss: 0.3139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4541, loss: 0.5391, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  76%|#######5  | 84/111 [00:57<00:17,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9616, LAS: 0.9271, UEM: 0.6359, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6056, partial_loss/deprel_loss: 0.4984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6830, loss: 0.5388, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  80%|########  | 89/111 [01:00<00:13,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9613, LAS: 0.9268, UEM: 0.6340, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1500, partial_loss/deprel_loss: 0.2520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3948, loss: 0.5409, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  85%|########4 | 94/111 [01:02<00:09,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9607, LAS: 0.9261, UEM: 0.6273, LEM: 0.4017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4857, partial_loss/deprel_loss: 0.3974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5782, loss: 0.5446, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||:  89%|########9 | 99/111 [01:05<00:06,  1.87it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9608, LAS: 0.9263, UEM: 0.6391, LEM: 0.4190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5761, partial_loss/deprel_loss: 0.4574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6442, loss: 0.5438, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||:  93%|#########2| 103/111 [01:07<00:04,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9232, UAS: 0.9606, LAS: 0.9262, UEM: 0.6421, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3545, partial_loss/deprel_loss: 0.4660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6068, loss: 0.5446, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||:  96%|#########6| 107/111 [01:10<00:02,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9610, LAS: 0.9266, UEM: 0.6457, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2279, partial_loss/deprel_loss: 0.2647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4205, loss: 0.5415, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||: 100%|##########| 111/111 [01:13<00:00,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9610, LAS: 0.9266, UEM: 0.6457, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2279, partial_loss/deprel_loss: 0.2647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4205, loss: 0.5415, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.265  |       N/A\n",
+      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.228  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.163  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - UEM                      |     0.646  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - loss                     |     0.542  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - LEM                      |     0.423  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - EM                       |     0.937  |       N/A\n",
+      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:26:44,764 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:26:49,799 - INFO - combo.training.trainer - Epoch duration: 0:01:21.342111\n",
+      "2023-04-07 01:26:49,799 - INFO - combo.training.trainer - Estimated training time remaining: 6:29:11\n",
+      "2023-04-07 01:26:49,799 - INFO - allennlp.training.trainer - Epoch 115/399\n",
+      "2023-04-07 01:26:49,799 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:26:49,800 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:26:49,811 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9547, LAS: 0.9173, UEM: 0.3925, LEM: 0.1752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3871, partial_loss/deprel_loss: 0.3791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5438, loss: 0.5949, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:   4%|3         | 4/111 [00:02<01:03,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9608, LAS: 0.9239, UEM: 0.6031, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0845, partial_loss/deprel_loss: 0.2596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3876, loss: 0.5477, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:   6%|6         | 7/111 [00:04<01:06,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9610, LAS: 0.9251, UEM: 0.6085, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2537, partial_loss/deprel_loss: 0.3027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4560, loss: 0.5365, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:   9%|9         | 10/111 [00:06<01:05,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9606, LAS: 0.9248, UEM: 0.5913, LEM: 0.3514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3193, partial_loss/deprel_loss: 0.3527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5091, loss: 0.5387, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:  13%|#2        | 14/111 [00:09<01:02,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8811, UAS: 0.9561, LAS: 0.9205, UEM: 0.5787, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9752, partial_loss/deprel_loss: 0.5953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8343, loss: 0.5763, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:  16%|#6        | 18/111 [00:11<01:00,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9571, LAS: 0.9214, UEM: 0.5802, LEM: 0.3486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4454, partial_loss/deprel_loss: 0.4338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5991, loss: 0.5686, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:  19%|#8        | 21/111 [00:13<00:59,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9558, LAS: 0.9203, UEM: 0.5699, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7849, partial_loss/deprel_loss: 0.5225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7381, loss: 0.5809, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  23%|##2       | 25/111 [00:16<00:54,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9003, UAS: 0.9560, LAS: 0.9204, UEM: 0.5712, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7318, partial_loss/deprel_loss: 0.5219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7270, loss: 0.5789, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  26%|##6       | 29/111 [00:18<00:52,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9562, LAS: 0.9205, UEM: 0.5662, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4325, partial_loss/deprel_loss: 0.3829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5558, loss: 0.5776, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  29%|##8       | 32/111 [00:20<00:51,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9567, LAS: 0.9210, UEM: 0.5642, LEM: 0.3343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5532, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6488, loss: 0.5761, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  32%|###2      | 36/111 [00:23<00:48,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9577, LAS: 0.9227, UEM: 0.5645, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2900, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4949, loss: 0.5676, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  36%|###6      | 40/111 [00:25<00:44,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9593, LAS: 0.9242, UEM: 0.6023, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1667, partial_loss/deprel_loss: 0.2403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3885, loss: 0.5565, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  40%|###9      | 44/111 [00:28<00:42,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9598, LAS: 0.9247, UEM: 0.6098, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1807, partial_loss/deprel_loss: 0.3618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.5529, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||:  43%|####3     | 48/111 [00:30<00:39,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9600, LAS: 0.9249, UEM: 0.6152, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8968, partial_loss/deprel_loss: 0.6086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8292, loss: 0.5531, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||:  47%|####6     | 52/111 [00:33<00:38,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9760, UAS: 0.9603, LAS: 0.9255, UEM: 0.6436, LEM: 0.4230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0247, partial_loss/deprel_loss: 0.0855, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2363, loss: 0.5484, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||:  50%|#####     | 56/111 [00:37<00:40,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9620, UAS: 0.9613, LAS: 0.9268, UEM: 0.6714, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0662, partial_loss/deprel_loss: 0.1438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2913, loss: 0.5381, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||:  53%|#####3    | 59/111 [00:39<00:40,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9611, LAS: 0.9266, UEM: 0.6727, LEM: 0.4602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1327, partial_loss/deprel_loss: 0.2068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3549, loss: 0.5380, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  57%|#####6    | 63/111 [00:42<00:37,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9608, LAS: 0.9264, UEM: 0.6661, LEM: 0.4527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3382, partial_loss/deprel_loss: 0.3869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5401, loss: 0.5396, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  59%|#####9    | 66/111 [00:45<00:33,  1.33it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9610, LAS: 0.9265, UEM: 0.6630, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1927, partial_loss/deprel_loss: 0.3164, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4546, loss: 0.5398, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  64%|######3   | 71/111 [00:47<00:26,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9604, LAS: 0.9259, UEM: 0.6528, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7439, partial_loss/deprel_loss: 0.5034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7144, loss: 0.5445, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  68%|######8   | 76/111 [00:49<00:21,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9600, LAS: 0.9254, UEM: 0.6427, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6552, partial_loss/deprel_loss: 0.4768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6753, loss: 0.5482, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  73%|#######2  | 81/111 [00:52<00:17,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9605, LAS: 0.9259, UEM: 0.6488, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1739, partial_loss/deprel_loss: 0.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4177, loss: 0.5444, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  77%|#######6  | 85/111 [00:54<00:14,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9603, LAS: 0.9255, UEM: 0.6422, LEM: 0.4275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1929, partial_loss/deprel_loss: 0.3498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4813, loss: 0.5465, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  80%|########  | 89/111 [00:57<00:13,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9602, LAS: 0.9253, UEM: 0.6407, LEM: 0.4251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5308, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6338, loss: 0.5477, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  84%|########3 | 93/111 [01:00<00:12,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9604, LAS: 0.9255, UEM: 0.6448, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1062, partial_loss/deprel_loss: 0.2317, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3694, loss: 0.5461, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  87%|########7 | 97/111 [01:03<00:09,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9604, LAS: 0.9255, UEM: 0.6440, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7574, partial_loss/deprel_loss: 0.5058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7189, loss: 0.5467, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||:  91%|######### | 101/111 [01:06<00:06,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9607, LAS: 0.9259, UEM: 0.6425, LEM: 0.4246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3432, partial_loss/deprel_loss: 0.3784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5342, loss: 0.5447, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||:  95%|#########4| 105/111 [01:09<00:04,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9607, LAS: 0.9259, UEM: 0.6409, LEM: 0.4238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4736, partial_loss/deprel_loss: 0.4850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6455, loss: 0.5447, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||:  98%|#########8| 109/111 [01:11<00:01,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9610, LAS: 0.9262, UEM: 0.6476, LEM: 0.4308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0943, partial_loss/deprel_loss: 0.2058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3463, loss: 0.5421, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||: 100%|##########| 111/111 [01:13<00:00,  1.52it/s]\n",
+      "2023-04-07 01:28:05,803 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9357, LAS: 0.8788, UEM: 0.3387, LEM: 0.0753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9730, partial_loss/deprel_loss: 35.4884, partial_loss/cycle_loss: 0.0000, batch_loss: 28.5853, loss: 31.0780, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:12,  1.09s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9552, LAS: 0.9039, UEM: 0.6997, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 22.8051, partial_loss/cycle_loss: 0.0000, batch_loss: 18.2725, loss: 25.2398, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  31%|###       | 4/13 [00:04<00:09,  1.09s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9505, LAS: 0.9004, UEM: 0.6364, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7520, partial_loss/deprel_loss: 28.9441, partial_loss/cycle_loss: 0.0000, batch_loss: 23.3056, loss: 25.0064, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:07<00:06,  1.04s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9546, LAS: 0.9063, UEM: 0.7099, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5701, partial_loss/deprel_loss: 23.5040, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9172, loss: 23.1846, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:09<00:04,  1.06s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9528, LAS: 0.9035, UEM: 0.6763, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7413, partial_loss/deprel_loss: 33.2838, partial_loss/cycle_loss: 0.0000, batch_loss: 26.7753, loss: 23.2175, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9483, LAS: 0.8987, UEM: 0.6599, LEM: 0.3961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6642, partial_loss/deprel_loss: 54.1649, partial_loss/cycle_loss: 0.0000, batch_loss: 43.6647, loss: 24.7903, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.00it/s]\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.206  |    54.165\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.094  |     1.664\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.163  |     0.000\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - UEM                      |     0.648  |     0.660\n",
+      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - LAS                      |     0.926  |     0.899\n",
+      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - loss                     |     0.542  |    24.790\n",
+      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - LEM                      |     0.431  |     0.396\n",
+      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |     0.948\n",
+      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - EM                       |     0.949  |     0.841\n",
+      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:28:18,783 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:28:23,018 - INFO - combo.training.trainer - Epoch duration: 0:01:33.219014\n",
+      "2023-04-07 01:28:23,019 - INFO - combo.training.trainer - Estimated training time remaining: 6:28:17\n",
+      "2023-04-07 01:28:23,019 - INFO - allennlp.training.trainer - Epoch 116/399\n",
+      "2023-04-07 01:28:23,019 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:28:23,020 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:28:23,029 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9574, LAS: 0.9219, UEM: 0.5537, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2990, partial_loss/deprel_loss: 0.3329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4890, loss: 0.5787, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:   4%|3         | 4/111 [00:02<01:11,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9581, LAS: 0.9241, UEM: 0.5307, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6387, partial_loss/deprel_loss: 0.4368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6399, loss: 0.5651, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:   7%|7         | 8/111 [00:05<01:07,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9591, LAS: 0.9241, UEM: 0.5168, LEM: 0.2895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4099, partial_loss/deprel_loss: 0.4618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6142, loss: 0.5604, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:  10%|9         | 11/111 [00:07<01:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9567, LAS: 0.9219, UEM: 0.5284, LEM: 0.3066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4870, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6121, loss: 0.5698, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:  13%|#2        | 14/111 [00:09<01:08,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9564, LAS: 0.9219, UEM: 0.5200, LEM: 0.2981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3841, partial_loss/deprel_loss: 0.3641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5309, loss: 0.5723, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:  15%|#5        | 17/111 [00:11<01:07,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9589, LAS: 0.9248, UEM: 0.6190, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5315, loss: 0.5545, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:  18%|#8        | 20/111 [00:14<01:06,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9577, LAS: 0.9236, UEM: 0.6216, LEM: 0.4336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5082, partial_loss/deprel_loss: 0.4548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6282, loss: 0.5616, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:  21%|##        | 23/111 [00:16<01:07,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9595, LAS: 0.9256, UEM: 0.6471, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1424, partial_loss/deprel_loss: 0.2302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3754, loss: 0.5457, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||:  23%|##3       | 26/111 [00:19<01:07,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9588, LAS: 0.9249, UEM: 0.6298, LEM: 0.4361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3933, partial_loss/deprel_loss: 0.4228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5796, loss: 0.5488, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||:  26%|##6       | 29/111 [00:21<01:02,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9606, LAS: 0.9268, UEM: 0.6540, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3722, partial_loss/deprel_loss: 0.3230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4956, loss: 0.5388, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||:  30%|##9       | 33/111 [00:23<00:54,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9612, LAS: 0.9271, UEM: 0.6495, LEM: 0.4434, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1959, partial_loss/deprel_loss: 0.3470, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4795, loss: 0.5359, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||:  34%|###4      | 38/111 [00:26<00:47,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9500, UAS: 0.9614, LAS: 0.9273, UEM: 0.6543, LEM: 0.4509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1142, partial_loss/deprel_loss: 0.1998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3453, loss: 0.5354, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||:  39%|###8      | 43/111 [00:28<00:40,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9616, LAS: 0.9277, UEM: 0.6489, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2601, partial_loss/deprel_loss: 0.3257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4753, loss: 0.5345, batch_reg_loss: 0.1627, reg_loss: 0.1627 ||:  43%|####3     | 48/111 [00:31<00:35,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9621, LAS: 0.9282, UEM: 0.6544, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1851, partial_loss/deprel_loss: 0.2794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4232, loss: 0.5299, batch_reg_loss: 0.1627, reg_loss: 0.1627 ||:  47%|####6     | 52/111 [00:33<00:35,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9624, LAS: 0.9282, UEM: 0.6494, LEM: 0.4354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3444, partial_loss/deprel_loss: 0.4008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5522, loss: 0.5285, batch_reg_loss: 0.1627, reg_loss: 0.1627 ||:  50%|#####     | 56/111 [00:36<00:35,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9626, LAS: 0.9284, UEM: 0.6518, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2388, partial_loss/deprel_loss: 0.3454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4868, loss: 0.5269, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  54%|#####4    | 60/111 [00:40<00:36,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9604, UAS: 0.9629, LAS: 0.9288, UEM: 0.6697, LEM: 0.4579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0658, partial_loss/deprel_loss: 0.1754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3161, loss: 0.5245, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  58%|#####7    | 64/111 [00:43<00:33,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9629, LAS: 0.9286, UEM: 0.6671, LEM: 0.4545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1502, partial_loss/deprel_loss: 0.2937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4276, loss: 0.5241, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  61%|######1   | 68/111 [00:45<00:29,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9630, LAS: 0.9289, UEM: 0.6664, LEM: 0.4523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2564, partial_loss/deprel_loss: 0.3409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4866, loss: 0.5225, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  65%|######4   | 72/111 [00:48<00:25,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9620, LAS: 0.9276, UEM: 0.6565, LEM: 0.4431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5197, partial_loss/deprel_loss: 0.4834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6533, loss: 0.5320, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  68%|######8   | 76/111 [00:50<00:23,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8912, UAS: 0.9617, LAS: 0.9273, UEM: 0.6535, LEM: 0.4384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8500, partial_loss/deprel_loss: 0.5179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7469, loss: 0.5336, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  72%|#######2  | 80/111 [00:53<00:20,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9613, LAS: 0.9271, UEM: 0.6508, LEM: 0.4368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5955, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.5355, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  76%|#######5  | 84/111 [00:56<00:18,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9300, UAS: 0.9606, LAS: 0.9264, UEM: 0.6449, LEM: 0.4306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3222, partial_loss/deprel_loss: 0.3930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5414, loss: 0.5413, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9608, LAS: 0.9267, UEM: 0.6465, LEM: 0.4318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2406, partial_loss/deprel_loss: 0.3309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4754, loss: 0.5395, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  83%|########2 | 92/111 [01:01<00:12,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9609, LAS: 0.9267, UEM: 0.6496, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7109, partial_loss/deprel_loss: 0.4976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7028, loss: 0.5385, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  86%|########6 | 96/111 [01:04<00:10,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9610, LAS: 0.9268, UEM: 0.6488, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6543, partial_loss/deprel_loss: 0.4789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6765, loss: 0.5377, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||:  90%|######### | 100/111 [01:06<00:07,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9608, LAS: 0.9266, UEM: 0.6439, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2691, partial_loss/deprel_loss: 0.3528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4986, loss: 0.5396, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||:  93%|#########2| 103/111 [01:08<00:05,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9610, LAS: 0.9268, UEM: 0.6465, LEM: 0.4289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1619, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4258, loss: 0.5377, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||:  96%|#########6| 107/111 [01:11<00:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9608, LAS: 0.9265, UEM: 0.6469, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1204, partial_loss/deprel_loss: 0.2431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3811, loss: 0.5391, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||:  99%|#########9| 110/111 [01:13<00:00,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9609, LAS: 0.9266, UEM: 0.6485, LEM: 0.4310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2016, partial_loss/deprel_loss: 0.2930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4372, loss: 0.5382, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
+      "2023-04-07 01:29:40,436 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:29:40,436 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:29:40,436 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.293  |       N/A\n",
+      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.202  |       N/A\n",
+      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.163  |       N/A\n",
+      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - UEM                      |     0.649  |       N/A\n",
+      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |       N/A\n",
+      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - loss                     |     0.538  |       N/A\n",
+      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - LEM                      |     0.431  |       N/A\n",
+      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
+      "2023-04-07 01:29:40,439 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:29:40,439 - INFO - combo.training.tensorboard_writer - EM                       |     0.938  |       N/A\n",
+      "2023-04-07 01:29:40,439 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:29:40,447 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:29:45,284 - INFO - combo.training.trainer - Epoch duration: 0:01:22.264978\n",
+      "2023-04-07 01:29:45,284 - INFO - combo.training.trainer - Estimated training time remaining: 6:26:55\n",
+      "2023-04-07 01:29:45,285 - INFO - allennlp.training.trainer - Epoch 117/399\n",
+      "2023-04-07 01:29:45,285 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:29:45,286 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:29:45,297 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9410, LAS: 0.9072, UEM: 0.2115, LEM: 0.0673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0066, partial_loss/deprel_loss: 0.4922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7576, loss: 0.6695, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:   3%|2         | 3/111 [00:02<01:16,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9573, LAS: 0.9234, UEM: 0.6225, LEM: 0.4012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1534, partial_loss/deprel_loss: 0.2371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3829, loss: 0.5587, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:   5%|5         | 6/111 [00:04<01:13,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9597, LAS: 0.9265, UEM: 0.6303, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2763, partial_loss/deprel_loss: 0.2943, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4532, loss: 0.5306, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9618, LAS: 0.9290, UEM: 0.6422, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3256, partial_loss/deprel_loss: 0.3279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4899, loss: 0.5178, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:  13%|#2        | 14/111 [00:09<01:04,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9631, LAS: 0.9301, UEM: 0.6359, LEM: 0.3976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.3239, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4711, loss: 0.5122, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:  16%|#6        | 18/111 [00:11<00:57,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9630, LAS: 0.9298, UEM: 0.6229, LEM: 0.3805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3032, partial_loss/deprel_loss: 0.3606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5115, loss: 0.5102, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:  21%|##        | 23/111 [00:13<00:50,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9634, LAS: 0.9309, UEM: 0.6398, LEM: 0.4021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1709, partial_loss/deprel_loss: 0.2609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4053, loss: 0.5038, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||:  25%|##5       | 28/111 [00:15<00:43,  1.90it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9280, UAS: 0.9632, LAS: 0.9309, UEM: 0.6331, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3200, partial_loss/deprel_loss: 0.4090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5536, loss: 0.5060, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||:  29%|##8       | 32/111 [00:17<00:41,  1.91it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9744, UAS: 0.9632, LAS: 0.9312, UEM: 0.6660, LEM: 0.4534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0344, partial_loss/deprel_loss: 0.0977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2474, loss: 0.5044, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||:  32%|###2      | 36/111 [00:21<00:46,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9634, LAS: 0.9313, UEM: 0.6693, LEM: 0.4571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4329, partial_loss/deprel_loss: 0.4586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6159, loss: 0.5044, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||:  36%|###6      | 40/111 [00:23<00:45,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9626, LAS: 0.9303, UEM: 0.6647, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6757, partial_loss/deprel_loss: 0.4823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6834, loss: 0.5078, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||:  40%|###9      | 44/111 [00:26<00:45,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9623, LAS: 0.9300, UEM: 0.6570, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5023, partial_loss/deprel_loss: 0.4532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6254, loss: 0.5114, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||:  43%|####3     | 48/111 [00:29<00:42,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9164, UAS: 0.9624, LAS: 0.9300, UEM: 0.6613, LEM: 0.4473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5246, partial_loss/deprel_loss: 0.4793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6507, loss: 0.5130, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||:  47%|####6     | 52/111 [00:32<00:39,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9625, LAS: 0.9299, UEM: 0.6535, LEM: 0.4376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3355, partial_loss/deprel_loss: 0.3536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.5163, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||:  50%|#####     | 56/111 [00:34<00:34,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9621, LAS: 0.9293, UEM: 0.6491, LEM: 0.4327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1408, partial_loss/deprel_loss: 0.2545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3941, loss: 0.5204, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||:  54%|#####4    | 60/111 [00:37<00:32,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9619, LAS: 0.9290, UEM: 0.6429, LEM: 0.4245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4015, partial_loss/deprel_loss: 0.3097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4904, loss: 0.5217, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  58%|#####7    | 64/111 [00:39<00:31,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8819, UAS: 0.9610, LAS: 0.9281, UEM: 0.6440, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0708, partial_loss/deprel_loss: 0.6247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8763, loss: 0.5269, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  61%|######1   | 68/111 [00:42<00:29,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9601, LAS: 0.9271, UEM: 0.6366, LEM: 0.4217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3447, partial_loss/deprel_loss: 0.3889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5424, loss: 0.5337, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  64%|######3   | 71/111 [00:44<00:27,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9602, LAS: 0.9270, UEM: 0.6335, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1685, partial_loss/deprel_loss: 0.3030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4385, loss: 0.5353, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  67%|######6   | 74/111 [00:47<00:26,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9603, LAS: 0.9271, UEM: 0.6388, LEM: 0.4246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5088, partial_loss/deprel_loss: 0.4509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6248, loss: 0.5350, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  69%|######9   | 77/111 [00:49<00:24,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9606, LAS: 0.9274, UEM: 0.6483, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6415, partial_loss/deprel_loss: 0.5587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7376, loss: 0.5339, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  72%|#######2  | 80/111 [00:51<00:22,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9608, LAS: 0.9275, UEM: 0.6506, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4282, partial_loss/deprel_loss: 0.4634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6186, loss: 0.5326, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  75%|#######4  | 83/111 [00:53<00:20,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9612, LAS: 0.9277, UEM: 0.6555, LEM: 0.4408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2927, partial_loss/deprel_loss: 0.3332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4874, loss: 0.5298, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  78%|#######8  | 87/111 [00:56<00:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9611, LAS: 0.9276, UEM: 0.6540, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6455, partial_loss/deprel_loss: 0.5085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6982, loss: 0.5311, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  81%|########1 | 90/111 [00:58<00:15,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9606, LAS: 0.9271, UEM: 0.6474, LEM: 0.4331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6479, partial_loss/deprel_loss: 0.4413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6449, loss: 0.5349, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  85%|########4 | 94/111 [01:01<00:11,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9608, LAS: 0.9273, UEM: 0.6451, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3137, partial_loss/deprel_loss: 0.3642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5164, loss: 0.5347, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  87%|########7 | 97/111 [01:03<00:09,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9607, LAS: 0.9271, UEM: 0.6447, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3215, partial_loss/deprel_loss: 0.4272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5683, loss: 0.5362, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  90%|######### | 100/111 [01:05<00:07,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9605, LAS: 0.9269, UEM: 0.6461, LEM: 0.4320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1824, partial_loss/deprel_loss: 0.2260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3796, loss: 0.5365, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  93%|#########2| 103/111 [01:07<00:05,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9608, LAS: 0.9272, UEM: 0.6491, LEM: 0.4333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1632, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4306, loss: 0.5345, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  95%|#########5| 106/111 [01:10<00:03,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9608, LAS: 0.9271, UEM: 0.6473, LEM: 0.4307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2056, partial_loss/deprel_loss: 0.3438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4784, loss: 0.5352, batch_reg_loss: 0.1622, reg_loss: 0.1624 ||:  99%|#########9| 110/111 [01:12<00:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9331, UAS: 0.9608, LAS: 0.9271, UEM: 0.6470, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3199, partial_loss/deprel_loss: 0.3751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5263, loss: 0.5351, batch_reg_loss: 0.1622, reg_loss: 0.1624 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.375  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.320  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.162  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - UEM                      |     0.647  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - loss                     |     0.535  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - LEM                      |     0.430  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - EM                       |     0.933  |       N/A\n",
+      "2023-04-07 01:31:01,942 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:31:01,947 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:31:06,980 - INFO - combo.training.trainer - Epoch duration: 0:01:21.695775\n",
+      "2023-04-07 01:31:06,981 - INFO - combo.training.trainer - Estimated training time remaining: 6:25:32\n",
+      "2023-04-07 01:31:06,981 - INFO - allennlp.training.trainer - Epoch 118/399\n",
+      "2023-04-07 01:31:06,982 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:31:06,982 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:31:06,992 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9584, LAS: 0.9244, UEM: 0.5742, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5284, partial_loss/deprel_loss: 0.4591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6352, loss: 0.5838, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:   5%|4         | 5/111 [00:02<00:49,  2.13it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9661, LAS: 0.9330, UEM: 0.6756, LEM: 0.4417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2489, partial_loss/deprel_loss: 0.3630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5024, loss: 0.5213, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:   8%|8         | 9/111 [00:05<00:53,  1.89it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9642, LAS: 0.9312, UEM: 0.6472, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2436, partial_loss/deprel_loss: 0.3190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4661, loss: 0.5239, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:  12%|#1        | 13/111 [00:07<00:54,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9160, UAS: 0.9629, LAS: 0.9304, UEM: 0.6386, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6097, partial_loss/deprel_loss: 0.4469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6417, loss: 0.5277, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:  15%|#5        | 17/111 [00:10<00:55,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9627, LAS: 0.9306, UEM: 0.6374, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4281, partial_loss/deprel_loss: 0.3719, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5453, loss: 0.5259, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:  19%|#8        | 21/111 [00:12<00:54,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9628, LAS: 0.9302, UEM: 0.6381, LEM: 0.4163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4613, partial_loss/deprel_loss: 0.4099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5824, loss: 0.5261, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:  23%|##3       | 26/111 [00:15<00:47,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9630, LAS: 0.9303, UEM: 0.6479, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1632, partial_loss/deprel_loss: 0.2524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3967, loss: 0.5214, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:  28%|##7       | 31/111 [00:17<00:42,  1.87it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9633, LAS: 0.9307, UEM: 0.6835, LEM: 0.4758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9265, partial_loss/deprel_loss: 0.5708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8041, loss: 0.5189, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  32%|###1      | 35/111 [00:20<00:45,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9635, LAS: 0.9309, UEM: 0.6790, LEM: 0.4666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3176, partial_loss/deprel_loss: 0.3150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4776, loss: 0.5163, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  35%|###5      | 39/111 [00:23<00:48,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9644, LAS: 0.9317, UEM: 0.7036, LEM: 0.4959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0596, partial_loss/deprel_loss: 0.1671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3077, loss: 0.5090, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  38%|###7      | 42/111 [00:26<00:49,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9646, LAS: 0.9317, UEM: 0.6970, LEM: 0.4853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4318, partial_loss/deprel_loss: 0.4018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5699, loss: 0.5093, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  41%|####1     | 46/111 [00:28<00:45,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9643, LAS: 0.9313, UEM: 0.6905, LEM: 0.4775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2069, partial_loss/deprel_loss: 0.3115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4527, loss: 0.5109, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  44%|####4     | 49/111 [00:30<00:42,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9520, UAS: 0.9647, LAS: 0.9317, UEM: 0.6980, LEM: 0.4860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0849, partial_loss/deprel_loss: 0.1925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3331, loss: 0.5082, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  47%|####6     | 52/111 [00:33<00:41,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9636, LAS: 0.9306, UEM: 0.6847, LEM: 0.4741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7901, partial_loss/deprel_loss: 0.4558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6847, loss: 0.5165, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  50%|#####     | 56/111 [00:35<00:37,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9637, LAS: 0.9306, UEM: 0.6816, LEM: 0.4689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3447, partial_loss/deprel_loss: 0.3302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4952, loss: 0.5146, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  53%|#####3    | 59/111 [00:37<00:35,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9631, LAS: 0.9296, UEM: 0.6729, LEM: 0.4598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3769, partial_loss/deprel_loss: 0.4646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6091, loss: 0.5212, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  56%|#####5    | 62/111 [00:39<00:33,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9633, LAS: 0.9297, UEM: 0.6692, LEM: 0.4535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2217, partial_loss/deprel_loss: 0.3478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4846, loss: 0.5206, batch_reg_loss: 0.1621, reg_loss: 0.1621 ||:  59%|#####9    | 66/111 [00:41<00:28,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9627, LAS: 0.9290, UEM: 0.6628, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6047, partial_loss/deprel_loss: 0.4760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6637, loss: 0.5258, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  63%|######3   | 70/111 [00:45<00:28,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9625, LAS: 0.9287, UEM: 0.6564, LEM: 0.4398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5930, loss: 0.5275, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  66%|######5   | 73/111 [00:47<00:26,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9627, LAS: 0.9290, UEM: 0.6556, LEM: 0.4382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3633, partial_loss/deprel_loss: 0.3333, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5013, loss: 0.5263, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  69%|######9   | 77/111 [00:49<00:22,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9437, UAS: 0.9630, LAS: 0.9293, UEM: 0.6552, LEM: 0.4360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2212, partial_loss/deprel_loss: 0.2669, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4198, loss: 0.5241, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  73%|#######2  | 81/111 [00:52<00:20,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9634, LAS: 0.9297, UEM: 0.6572, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1872, partial_loss/deprel_loss: 0.2738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4185, loss: 0.5218, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  77%|#######6  | 85/111 [00:54<00:17,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9632, LAS: 0.9295, UEM: 0.6530, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2652, partial_loss/deprel_loss: 0.3209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4717, loss: 0.5238, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  80%|########  | 89/111 [00:57<00:14,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9628, LAS: 0.9290, UEM: 0.6508, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2090, partial_loss/deprel_loss: 0.3746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5034, loss: 0.5269, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  84%|########3 | 93/111 [01:00<00:12,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9627, LAS: 0.9289, UEM: 0.6587, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1577, partial_loss/deprel_loss: 0.2665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4067, loss: 0.5265, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  87%|########7 | 97/111 [01:03<00:10,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9625, LAS: 0.9288, UEM: 0.6574, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4383, partial_loss/deprel_loss: 0.4457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6062, loss: 0.5284, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  90%|######### | 100/111 [01:05<00:07,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9621, LAS: 0.9284, UEM: 0.6529, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8222, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7947, loss: 0.5315, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  93%|#########2| 103/111 [01:07<00:05,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9622, LAS: 0.9286, UEM: 0.6580, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5416, partial_loss/deprel_loss: 0.4245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6099, loss: 0.5292, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  95%|#########5| 106/111 [01:10<00:03,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.9617, LAS: 0.9280, UEM: 0.6534, LEM: 0.4338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0117, partial_loss/deprel_loss: 0.5263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7853, loss: 0.5327, batch_reg_loss: 0.1619, reg_loss: 0.1621 ||:  99%|#########9| 110/111 [01:13<00:00,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9615, LAS: 0.9277, UEM: 0.6512, LEM: 0.4323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6477, partial_loss/deprel_loss: 0.5848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7593, loss: 0.5348, batch_reg_loss: 0.1619, reg_loss: 0.1621 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
+      "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.585  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.648  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.162  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - UEM                      |     0.651  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - LAS                      |     0.928  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - loss                     |     0.535  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - LEM                      |     0.432  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - EM                       |     0.901  |       N/A\n",
+      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:32:24,083 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:32:29,151 - INFO - combo.training.trainer - Epoch duration: 0:01:22.169650\n",
+      "2023-04-07 01:32:29,152 - INFO - combo.training.trainer - Estimated training time remaining: 6:24:11\n",
+      "2023-04-07 01:32:29,153 - INFO - allennlp.training.trainer - Epoch 119/399\n",
+      "2023-04-07 01:32:29,153 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:32:29,153 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:32:29,162 - INFO - allennlp.training.trainer - Training\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9560, LAS: 0.9230, UEM: 0.6512, LEM: 0.4110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6316, partial_loss/deprel_loss: 0.4480, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6467, loss: 0.5886, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:   5%|4         | 5/111 [00:02<00:52,  2.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9547, LAS: 0.9204, UEM: 0.5686, LEM: 0.3328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9893, partial_loss/deprel_loss: 0.5484, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7985, loss: 0.5991, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:   9%|9         | 10/111 [00:04<00:49,  2.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9562, LAS: 0.9221, UEM: 0.5881, LEM: 0.3630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6123, partial_loss/deprel_loss: 0.4122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6141, loss: 0.5779, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  14%|#3        | 15/111 [00:07<00:46,  2.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9558, LAS: 0.9221, UEM: 0.5655, LEM: 0.3452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3024, partial_loss/deprel_loss: 0.3077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.5763, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  17%|#7        | 19/111 [00:09<00:49,  1.88it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9567, LAS: 0.9229, UEM: 0.5671, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4757, partial_loss/deprel_loss: 0.4163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5901, loss: 0.5670, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  21%|##        | 23/111 [00:12<00:49,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9571, LAS: 0.9234, UEM: 0.6038, LEM: 0.3925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2781, partial_loss/deprel_loss: 0.3534, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.5615, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  23%|##3       | 26/111 [00:14<00:53,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9688, UAS: 0.9594, LAS: 0.9259, UEM: 0.6656, LEM: 0.4674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0312, partial_loss/deprel_loss: 0.1093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2556, loss: 0.5430, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  26%|##6       | 29/111 [00:17<00:56,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9607, LAS: 0.9274, UEM: 0.6750, LEM: 0.4757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1359, partial_loss/deprel_loss: 0.2697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4048, loss: 0.5329, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  29%|##8       | 32/111 [00:19<00:57,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9607, LAS: 0.9274, UEM: 0.6677, LEM: 0.4672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2178, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4143, loss: 0.5330, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  32%|###1      | 35/111 [00:21<00:54,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9616, LAS: 0.9282, UEM: 0.6710, LEM: 0.4637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2761, partial_loss/deprel_loss: 0.3460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4939, loss: 0.5294, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  34%|###4      | 38/111 [00:23<00:51,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9621, LAS: 0.9284, UEM: 0.6754, LEM: 0.4638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2917, partial_loss/deprel_loss: 0.3887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5312, loss: 0.5263, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  37%|###6      | 41/111 [00:25<00:49,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9617, LAS: 0.9280, UEM: 0.6783, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0769, partial_loss/deprel_loss: 0.2259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3580, loss: 0.5280, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  40%|###9      | 44/111 [00:27<00:47,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9621, LAS: 0.9284, UEM: 0.6747, LEM: 0.4613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3800, partial_loss/deprel_loss: 0.3772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5396, loss: 0.5269, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  42%|####2     | 47/111 [00:29<00:44,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9608, LAS: 0.9271, UEM: 0.6570, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5127, partial_loss/deprel_loss: 0.4390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6155, loss: 0.5357, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  46%|####5     | 51/111 [00:32<00:41,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9614, LAS: 0.9277, UEM: 0.6581, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3493, partial_loss/deprel_loss: 0.4118, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5611, loss: 0.5331, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  50%|####9     | 55/111 [00:35<00:38,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9612, LAS: 0.9275, UEM: 0.6545, LEM: 0.4409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4683, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.5331, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  52%|#####2    | 58/111 [00:37<00:37,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9610, LAS: 0.9275, UEM: 0.6621, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5465, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6085, loss: 0.5332, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  55%|#####4    | 61/111 [00:39<00:35,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9610, LAS: 0.9276, UEM: 0.6568, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3979, partial_loss/deprel_loss: 0.4106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5698, loss: 0.5333, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  58%|#####7    | 64/111 [00:42<00:34,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9608, LAS: 0.9273, UEM: 0.6518, LEM: 0.4414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2573, partial_loss/deprel_loss: 0.3191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.5350, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  60%|######    | 67/111 [00:44<00:31,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9607, LAS: 0.9271, UEM: 0.6513, LEM: 0.4398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1883, partial_loss/deprel_loss: 0.3120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4490, loss: 0.5358, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  63%|######3   | 70/111 [00:46<00:29,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9607, LAS: 0.9270, UEM: 0.6530, LEM: 0.4406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3512, partial_loss/deprel_loss: 0.3129, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4823, loss: 0.5351, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  67%|######6   | 74/111 [00:49<00:26,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9603, LAS: 0.9266, UEM: 0.6537, LEM: 0.4407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2083, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4603, loss: 0.5373, batch_reg_loss: 0.1618, reg_loss: 0.1618 ||:  70%|#######   | 78/111 [00:51<00:23,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9600, LAS: 0.9264, UEM: 0.6507, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7320, partial_loss/deprel_loss: 0.4751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6882, loss: 0.5391, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  73%|#######2  | 81/111 [00:54<00:22,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9596, LAS: 0.9260, UEM: 0.6459, LEM: 0.4345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9141, partial_loss/deprel_loss: 0.5886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8154, loss: 0.5417, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  77%|#######6  | 85/111 [00:56<00:18,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9593, LAS: 0.9257, UEM: 0.6400, LEM: 0.4291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5148, partial_loss/deprel_loss: 0.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6482, loss: 0.5443, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  79%|#######9  | 88/111 [00:59<00:16,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9596, LAS: 0.9261, UEM: 0.6410, LEM: 0.4290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.2798, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4468, loss: 0.5411, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  82%|########1 | 91/111 [01:01<00:14,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9600, LAS: 0.9265, UEM: 0.6463, LEM: 0.4342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3279, partial_loss/deprel_loss: 0.3422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5010, loss: 0.5384, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  85%|########4 | 94/111 [01:03<00:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9601, LAS: 0.9266, UEM: 0.6469, LEM: 0.4343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3405, partial_loss/deprel_loss: 0.3789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5329, loss: 0.5386, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  87%|########7 | 97/111 [01:05<00:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9602, LAS: 0.9266, UEM: 0.6479, LEM: 0.4355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5201, partial_loss/deprel_loss: 0.4496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6254, loss: 0.5378, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  90%|######### | 100/111 [01:07<00:07,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9606, LAS: 0.9270, UEM: 0.6509, LEM: 0.4367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5157, partial_loss/deprel_loss: 0.5044, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6684, loss: 0.5354, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  94%|#########3| 104/111 [01:09<00:04,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9607, LAS: 0.9271, UEM: 0.6519, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2124, partial_loss/deprel_loss: 0.3220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4618, loss: 0.5335, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  97%|#########7| 108/111 [01:12<00:02,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9607, LAS: 0.9272, UEM: 0.6491, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.2724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4298, loss: 0.5331, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 100%|##########| 111/111 [01:14<00:00,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9607, LAS: 0.9272, UEM: 0.6491, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.2724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4298, loss: 0.5331, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
+      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.272  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.251  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.162  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - UEM                      |     0.649  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - loss                     |     0.533  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - LEM                      |     0.435  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - EM                       |     0.936  |       N/A\n",
+      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:33:46,623 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:33:54,256 - INFO - combo.training.trainer - Epoch duration: 0:01:25.103205\n",
+      "2023-04-07 01:33:54,256 - INFO - combo.training.trainer - Estimated training time remaining: 6:22:56\n",
+      "2023-04-07 01:33:54,257 - INFO - allennlp.training.trainer - Epoch 120/399\n",
+      "2023-04-07 01:33:54,258 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:33:54,259 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:33:54,269 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9004, UAS: 0.9501, LAS: 0.9170, UEM: 0.5021, LEM: 0.3026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8535, partial_loss/deprel_loss: 0.5228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7506, loss: 0.5918, batch_reg_loss: 0.1617, reg_loss: 0.1617 ||:   4%|3         | 4/111 [00:02<01:01,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9531, LAS: 0.9200, UEM: 0.4871, LEM: 0.2667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5064, partial_loss/deprel_loss: 0.4212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5999, loss: 0.5803, batch_reg_loss: 0.1617, reg_loss: 0.1617 ||:   7%|7         | 8/111 [00:05<01:02,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9541, LAS: 0.9206, UEM: 0.5231, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6122, partial_loss/deprel_loss: 0.4584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.5758, batch_reg_loss: 0.1616, reg_loss: 0.1617 ||:  10%|9         | 11/111 [00:07<01:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9580, LAS: 0.9244, UEM: 0.5806, LEM: 0.3570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3549, partial_loss/deprel_loss: 0.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5143, loss: 0.5547, batch_reg_loss: 0.1616, reg_loss: 0.1617 ||:  13%|#2        | 14/111 [00:09<01:05,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9164, UAS: 0.9595, LAS: 0.9262, UEM: 0.5897, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5475, partial_loss/deprel_loss: 0.4541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6344, loss: 0.5433, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  16%|#6        | 18/111 [00:12<01:01,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9603, LAS: 0.9269, UEM: 0.5869, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3965, partial_loss/deprel_loss: 0.3725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5389, loss: 0.5377, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  20%|#9        | 22/111 [00:14<00:58,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9740, UAS: 0.9625, LAS: 0.9299, UEM: 0.6652, LEM: 0.4636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0359, partial_loss/deprel_loss: 0.1071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2545, loss: 0.5194, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  23%|##2       | 25/111 [00:17<01:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9603, LAS: 0.9278, UEM: 0.6394, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2706, partial_loss/deprel_loss: 0.3206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4722, loss: 0.5364, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  26%|##6       | 29/111 [00:19<00:55,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9608, LAS: 0.9282, UEM: 0.6520, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2792, partial_loss/deprel_loss: 0.3689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5125, loss: 0.5330, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  29%|##8       | 32/111 [00:21<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9617, LAS: 0.9292, UEM: 0.6638, LEM: 0.4631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6578, partial_loss/deprel_loss: 0.3979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6114, loss: 0.5262, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  32%|###2      | 36/111 [00:24<00:51,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9611, LAS: 0.9286, UEM: 0.6649, LEM: 0.4640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4831, partial_loss/deprel_loss: 0.4557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6227, loss: 0.5295, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  36%|###6      | 40/111 [00:27<00:48,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9621, LAS: 0.9297, UEM: 0.6798, LEM: 0.4768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3156, partial_loss/deprel_loss: 0.4022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5464, loss: 0.5221, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  39%|###8      | 43/111 [00:29<00:46,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9620, LAS: 0.9296, UEM: 0.6714, LEM: 0.4641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5441, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.5224, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  42%|####2     | 47/111 [00:31<00:42,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9619, LAS: 0.9292, UEM: 0.6658, LEM: 0.4540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5552, partial_loss/deprel_loss: 0.4651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6446, loss: 0.5248, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  46%|####5     | 51/111 [00:34<00:40,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9615, LAS: 0.9288, UEM: 0.6645, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7061, partial_loss/deprel_loss: 0.5740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7619, loss: 0.5273, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  49%|####8     | 54/111 [00:36<00:38,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9615, LAS: 0.9286, UEM: 0.6585, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3896, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5627, loss: 0.5292, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  52%|#####2    | 58/111 [00:38<00:34,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9623, LAS: 0.9292, UEM: 0.6673, LEM: 0.4507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3596, partial_loss/deprel_loss: 0.4629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6037, loss: 0.5255, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  56%|#####5    | 62/111 [00:41<00:32,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9628, LAS: 0.9299, UEM: 0.6752, LEM: 0.4595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2684, partial_loss/deprel_loss: 0.3365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4844, loss: 0.5204, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  59%|#####8    | 65/111 [00:43<00:31,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9619, LAS: 0.9288, UEM: 0.6688, LEM: 0.4528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3563, partial_loss/deprel_loss: 0.3716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5301, loss: 0.5295, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  61%|######1   | 68/111 [00:46<00:30,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9540, UAS: 0.9615, LAS: 0.9283, UEM: 0.6717, LEM: 0.4592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0960, partial_loss/deprel_loss: 0.1973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3385, loss: 0.5329, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  64%|######3   | 71/111 [00:48<00:29,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9619, LAS: 0.9286, UEM: 0.6709, LEM: 0.4567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2529, partial_loss/deprel_loss: 0.3776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.5311, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  68%|######7   | 75/111 [00:51<00:25,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9617, LAS: 0.9284, UEM: 0.6664, LEM: 0.4508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4704, partial_loss/deprel_loss: 0.4265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5967, loss: 0.5322, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  71%|#######1  | 79/111 [00:53<00:22,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9618, LAS: 0.9285, UEM: 0.6676, LEM: 0.4516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2552, partial_loss/deprel_loss: 0.3319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.5314, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  74%|#######3  | 82/111 [00:56<00:20,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9618, LAS: 0.9283, UEM: 0.6666, LEM: 0.4497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1772, partial_loss/deprel_loss: 0.2633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4075, loss: 0.5323, batch_reg_loss: 0.1614, reg_loss: 0.1616 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9617, LAS: 0.9283, UEM: 0.6735, LEM: 0.4597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0861, partial_loss/deprel_loss: 0.5565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8239, loss: 0.5321, batch_reg_loss: 0.1614, reg_loss: 0.1616 ||:  80%|########  | 89/111 [01:01<00:15,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9616, LAS: 0.9283, UEM: 0.6689, LEM: 0.4549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2165, partial_loss/deprel_loss: 0.3058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4494, loss: 0.5322, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||:  84%|########3 | 93/111 [01:03<00:12,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9617, LAS: 0.9281, UEM: 0.6673, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1981, partial_loss/deprel_loss: 0.3654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4933, loss: 0.5328, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||:  86%|########6 | 96/111 [01:05<00:10,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9617, LAS: 0.9281, UEM: 0.6644, LEM: 0.4475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3597, partial_loss/deprel_loss: 0.3367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5027, loss: 0.5319, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||:  90%|######### | 100/111 [01:08<00:07,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9613, LAS: 0.9277, UEM: 0.6560, LEM: 0.4402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3539, partial_loss/deprel_loss: 0.3841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.5347, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||:  95%|#########4| 105/111 [01:10<00:03,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9615, LAS: 0.9278, UEM: 0.6528, LEM: 0.4349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1941, partial_loss/deprel_loss: 0.3065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4454, loss: 0.5337, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||:  99%|#########9| 110/111 [01:12<00:00,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9616, LAS: 0.9279, UEM: 0.6534, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2313, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4888, loss: 0.5333, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
+      "2023-04-07 01:35:10,476 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9340, LAS: 0.8843, UEM: 0.7299, LEM: 0.4799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1551, partial_loss/deprel_loss: 22.5874, partial_loss/cycle_loss: 0.0000, batch_loss: 18.1009, loss: 30.5976, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:12,  1.10s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9231, UAS: 0.9563, LAS: 0.9123, UEM: 0.8067, LEM: 0.5765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3924, partial_loss/deprel_loss: 25.3394, partial_loss/cycle_loss: 0.0000, batch_loss: 20.3500, loss: 21.9278, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:05<00:08,  1.06s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9492, LAS: 0.9002, UEM: 0.7154, LEM: 0.4758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1023, partial_loss/deprel_loss: 41.2377, partial_loss/cycle_loss: 0.0000, batch_loss: 33.2106, loss: 24.2740, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:08<00:05,  1.04s/it]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9480, LAS: 0.8980, UEM: 0.6665, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7164, partial_loss/deprel_loss: 32.8922, partial_loss/cycle_loss: 0.0000, batch_loss: 26.4571, loss: 23.9450, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9475, LAS: 0.8973, UEM: 0.6503, LEM: 0.3892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4480, partial_loss/deprel_loss: 23.6254, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9900, loss: 24.5413, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
+      "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.351  |    23.625\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.231  |     0.448\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.162  |     0.000\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - UEM                      |     0.653  |     0.650\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - LAS                      |     0.928  |     0.897\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - loss                     |     0.533  |    24.541\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - LEM                      |     0.435  |     0.389\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |     0.947\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - EM                       |     0.935  |     0.914\n",
+      "2023-04-07 01:35:23,096 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:35:23,101 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:35:28,020 - INFO - combo.training.trainer - Epoch duration: 0:01:33.762829\n",
+      "2023-04-07 01:35:28,021 - INFO - combo.training.trainer - Estimated training time remaining: 6:22:01\n",
+      "2023-04-07 01:35:28,021 - INFO - allennlp.training.trainer - Epoch 121/399\n",
+      "2023-04-07 01:35:28,021 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:35:28,021 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:35:28,028 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9625, LAS: 0.9278, UEM: 0.6975, LEM: 0.4612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6757, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6717, loss: 0.5151, batch_reg_loss: 0.1614, reg_loss: 0.1614 ||:   3%|2         | 3/111 [00:02<01:16,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9672, LAS: 0.9355, UEM: 0.7027, LEM: 0.4777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2837, partial_loss/deprel_loss: 0.3431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4926, loss: 0.4797, batch_reg_loss: 0.1614, reg_loss: 0.1614 ||:   6%|6         | 7/111 [00:04<01:10,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9678, LAS: 0.9357, UEM: 0.7548, LEM: 0.5496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6550, partial_loss/deprel_loss: 0.5144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7039, loss: 0.4759, batch_reg_loss: 0.1614, reg_loss: 0.1614 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9383, UAS: 0.9662, LAS: 0.9341, UEM: 0.7161, LEM: 0.5052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2910, partial_loss/deprel_loss: 0.2941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4548, loss: 0.4895, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||:  12%|#1        | 13/111 [00:08<01:07,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9625, LAS: 0.9294, UEM: 0.7186, LEM: 0.5103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0669, partial_loss/deprel_loss: 0.2664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3879, loss: 0.5213, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||:  14%|#4        | 16/111 [00:11<01:07,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9621, LAS: 0.9291, UEM: 0.6897, LEM: 0.4818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4282, partial_loss/deprel_loss: 0.4310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5918, loss: 0.5272, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||:  18%|#8        | 20/111 [00:13<01:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9629, LAS: 0.9297, UEM: 0.7008, LEM: 0.4936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4723, partial_loss/deprel_loss: 0.4305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6002, loss: 0.5215, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||:  21%|##        | 23/111 [00:15<01:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9048, UAS: 0.9615, LAS: 0.9286, UEM: 0.6829, LEM: 0.4761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7597, partial_loss/deprel_loss: 0.5481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7517, loss: 0.5324, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  23%|##3       | 26/111 [00:17<00:59,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9601, LAS: 0.9271, UEM: 0.6503, LEM: 0.4472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.3808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.5419, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  27%|##7       | 30/111 [00:20<00:56,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9600, LAS: 0.9269, UEM: 0.6390, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3166, partial_loss/deprel_loss: 0.3335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4914, loss: 0.5444, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  30%|##9       | 33/111 [00:22<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9602, LAS: 0.9271, UEM: 0.6246, LEM: 0.4132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5958, partial_loss/deprel_loss: 0.4498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.5440, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  33%|###3      | 37/111 [00:25<00:49,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9592, LAS: 0.9259, UEM: 0.6117, LEM: 0.4009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9584, partial_loss/deprel_loss: 0.5039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7561, loss: 0.5516, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  36%|###6      | 40/111 [00:27<00:48,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9582, LAS: 0.9248, UEM: 0.5995, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8587, partial_loss/deprel_loss: 0.6059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8177, loss: 0.5590, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  39%|###8      | 43/111 [00:29<00:46,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9592, LAS: 0.9257, UEM: 0.6153, LEM: 0.4001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1867, partial_loss/deprel_loss: 0.2768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4200, loss: 0.5514, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  41%|####1     | 46/111 [00:31<00:46,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8932, UAS: 0.9586, LAS: 0.9252, UEM: 0.6056, LEM: 0.3905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8144, partial_loss/deprel_loss: 0.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7414, loss: 0.5554, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  45%|####5     | 50/111 [00:34<00:42,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9596, LAS: 0.9260, UEM: 0.6167, LEM: 0.3957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1388, partial_loss/deprel_loss: 0.2741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4083, loss: 0.5495, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  48%|####7     | 53/111 [00:36<00:41,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9602, LAS: 0.9265, UEM: 0.6188, LEM: 0.3926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.3921, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5326, loss: 0.5468, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9598, LAS: 0.9262, UEM: 0.6186, LEM: 0.3944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1625, partial_loss/deprel_loss: 0.2233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3724, loss: 0.5476, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  55%|#####4    | 61/111 [00:41<00:33,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9602, LAS: 0.9266, UEM: 0.6270, LEM: 0.4035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4080, partial_loss/deprel_loss: 0.4123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5727, loss: 0.5433, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  59%|#####8    | 65/111 [00:43<00:29,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9609, LAS: 0.9273, UEM: 0.6400, LEM: 0.4165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1509, partial_loss/deprel_loss: 0.2523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3933, loss: 0.5379, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  62%|######2   | 69/111 [00:46<00:25,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9614, LAS: 0.9277, UEM: 0.6463, LEM: 0.4210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2193, partial_loss/deprel_loss: 0.3163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4581, loss: 0.5341, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  66%|######5   | 73/111 [00:48<00:22,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9614, LAS: 0.9276, UEM: 0.6457, LEM: 0.4195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2231, partial_loss/deprel_loss: 0.3305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4702, loss: 0.5339, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  70%|#######   | 78/111 [00:50<00:18,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9732, UAS: 0.9616, LAS: 0.9279, UEM: 0.6571, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0336, partial_loss/deprel_loss: 0.0988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2469, loss: 0.5322, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  74%|#######3  | 82/111 [00:53<00:17,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9616, LAS: 0.9279, UEM: 0.6532, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5493, partial_loss/deprel_loss: 0.4245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6106, loss: 0.5317, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  77%|#######7  | 86/111 [00:56<00:16,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9621, LAS: 0.9284, UEM: 0.6628, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1212, partial_loss/deprel_loss: 0.2469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3829, loss: 0.5276, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  81%|########1 | 90/111 [00:58<00:13,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9621, LAS: 0.9284, UEM: 0.6589, LEM: 0.4386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2574, partial_loss/deprel_loss: 0.3425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4866, loss: 0.5275, batch_reg_loss: 0.1611, reg_loss: 0.1613 ||:  85%|########4 | 94/111 [01:01<00:10,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9617, LAS: 0.9281, UEM: 0.6526, LEM: 0.4330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4018, partial_loss/deprel_loss: 0.4294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 0.5303, batch_reg_loss: 0.1611, reg_loss: 0.1613 ||:  88%|########8 | 98/111 [01:03<00:08,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9618, LAS: 0.9281, UEM: 0.6492, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2187, partial_loss/deprel_loss: 0.3255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4653, loss: 0.5298, batch_reg_loss: 0.1611, reg_loss: 0.1613 ||:  92%|#########1| 102/111 [01:06<00:05,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9621, LAS: 0.9285, UEM: 0.6590, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1560, partial_loss/deprel_loss: 0.2417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3856, loss: 0.5267, batch_reg_loss: 0.1611, reg_loss: 0.1612 ||:  95%|#########5| 106/111 [01:09<00:03,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9620, LAS: 0.9284, UEM: 0.6538, LEM: 0.4340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2230, partial_loss/deprel_loss: 0.3147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4574, loss: 0.5279, batch_reg_loss: 0.1611, reg_loss: 0.1612 ||:  99%|#########9| 110/111 [01:11<00:00,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9620, LAS: 0.9284, UEM: 0.6522, LEM: 0.4325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3857, partial_loss/deprel_loss: 0.3601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5263, loss: 0.5279, batch_reg_loss: 0.1611, reg_loss: 0.1612 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
+      "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.360  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.386  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.161  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - UEM                      |     0.652  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - LAS                      |     0.928  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - loss                     |     0.528  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - LEM                      |     0.433  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - EM                       |     0.932  |       N/A\n",
+      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:36:43,257 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:36:49,054 - INFO - combo.training.trainer - Epoch duration: 0:01:21.032962\n",
+      "2023-04-07 01:36:49,054 - INFO - combo.training.trainer - Estimated training time remaining: 6:20:36\n",
+      "2023-04-07 01:36:49,054 - INFO - allennlp.training.trainer - Epoch 122/399\n",
+      "2023-04-07 01:36:49,055 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:36:49,055 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:36:49,065 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9650, LAS: 0.9338, UEM: 0.6522, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1713, partial_loss/deprel_loss: 0.2491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3946, loss: 0.4751, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||:   3%|2         | 3/111 [00:02<01:13,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9639, LAS: 0.9312, UEM: 0.6423, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1668, partial_loss/deprel_loss: 0.2690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4096, loss: 0.4931, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||:   5%|5         | 6/111 [00:04<01:15,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9595, LAS: 0.9277, UEM: 0.6090, LEM: 0.3797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6934, partial_loss/deprel_loss: 0.4242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6391, loss: 0.5225, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||:   8%|8         | 9/111 [00:06<01:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9620, LAS: 0.9302, UEM: 0.6435, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5243, partial_loss/deprel_loss: 0.4132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5965, loss: 0.5120, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||:  11%|#         | 12/111 [00:08<01:10,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9622, LAS: 0.9303, UEM: 0.6295, LEM: 0.4019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5368, partial_loss/deprel_loss: 0.4377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6186, loss: 0.5119, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||:  14%|#4        | 16/111 [00:11<01:06,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9621, LAS: 0.9310, UEM: 0.6313, LEM: 0.4091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1706, partial_loss/deprel_loss: 0.2616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4044, loss: 0.5085, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||:  18%|#8        | 20/111 [00:13<01:02,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9600, LAS: 0.9284, UEM: 0.6104, LEM: 0.3878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2424, partial_loss/deprel_loss: 0.3302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4736, loss: 0.5285, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||:  22%|##1       | 24/111 [00:16<00:57,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9351, UAS: 0.9605, LAS: 0.9289, UEM: 0.6192, LEM: 0.3952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2865, partial_loss/deprel_loss: 0.2876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4484, loss: 0.5258, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||:  24%|##4       | 27/111 [00:18<00:57,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9619, LAS: 0.9303, UEM: 0.6544, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1432, partial_loss/deprel_loss: 0.2489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3888, loss: 0.5141, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||:  27%|##7       | 30/111 [00:21<00:58,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9629, LAS: 0.9312, UEM: 0.6662, LEM: 0.4462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3693, partial_loss/deprel_loss: 0.3934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5496, loss: 0.5084, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  30%|##9       | 33/111 [00:23<00:57,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9629, LAS: 0.9305, UEM: 0.6631, LEM: 0.4380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5729, partial_loss/deprel_loss: 0.5477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7137, loss: 0.5118, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  32%|###2      | 36/111 [00:25<00:53,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9633, LAS: 0.9313, UEM: 0.6878, LEM: 0.4793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2916, partial_loss/deprel_loss: 0.3384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4900, loss: 0.5070, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  35%|###5      | 39/111 [00:27<00:54,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9630, LAS: 0.9308, UEM: 0.6790, LEM: 0.4691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4333, partial_loss/deprel_loss: 0.4353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.5128, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  38%|###7      | 42/111 [00:29<00:50,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9631, LAS: 0.9308, UEM: 0.6764, LEM: 0.4639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5079, partial_loss/deprel_loss: 0.3939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5777, loss: 0.5122, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  41%|####      | 45/111 [00:31<00:47,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9633, LAS: 0.9310, UEM: 0.6768, LEM: 0.4627, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4829, loss: 0.5085, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  45%|####5     | 50/111 [00:34<00:38,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9636, LAS: 0.9313, UEM: 0.6799, LEM: 0.4677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1367, partial_loss/deprel_loss: 0.2098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3562, loss: 0.5074, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  49%|####8     | 54/111 [00:36<00:36,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9640, LAS: 0.9317, UEM: 0.6884, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4297, partial_loss/deprel_loss: 0.4490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6061, loss: 0.5048, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  52%|#####2    | 58/111 [00:39<00:34,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9637, LAS: 0.9314, UEM: 0.6777, LEM: 0.4678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3982, partial_loss/deprel_loss: 0.3819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5461, loss: 0.5078, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  56%|#####5    | 62/111 [00:42<00:31,  1.55it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9630, LAS: 0.9305, UEM: 0.6654, LEM: 0.4556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6359, partial_loss/deprel_loss: 0.4622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6578, loss: 0.5146, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  59%|#####9    | 66/111 [00:44<00:28,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9625, LAS: 0.9298, UEM: 0.6570, LEM: 0.4457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3815, partial_loss/deprel_loss: 0.3840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5444, loss: 0.5197, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  63%|######3   | 70/111 [00:46<00:24,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8922, UAS: 0.9622, LAS: 0.9297, UEM: 0.6520, LEM: 0.4398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0289, partial_loss/deprel_loss: 0.5635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8175, loss: 0.5221, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  68%|######7   | 75/111 [00:48<00:20,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9626, LAS: 0.9299, UEM: 0.6525, LEM: 0.4355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2345, partial_loss/deprel_loss: 0.3180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4622, loss: 0.5188, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  72%|#######2  | 80/111 [00:51<00:16,  1.86it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9625, LAS: 0.9298, UEM: 0.6539, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2805, partial_loss/deprel_loss: 0.3755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5174, loss: 0.5198, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  76%|#######5  | 84/111 [00:54<00:16,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9627, LAS: 0.9299, UEM: 0.6608, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7551, partial_loss/deprel_loss: 0.5496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7516, loss: 0.5183, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  79%|#######9  | 88/111 [00:56<00:14,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9627, LAS: 0.9299, UEM: 0.6589, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5500, partial_loss/deprel_loss: 0.4632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6415, loss: 0.5184, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  83%|########2 | 92/111 [00:59<00:12,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9560, UAS: 0.9624, LAS: 0.9296, UEM: 0.6645, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0866, partial_loss/deprel_loss: 0.1841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3254, loss: 0.5205, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||:  86%|########6 | 96/111 [01:03<00:10,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9627, LAS: 0.9298, UEM: 0.6662, LEM: 0.4488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1921, partial_loss/deprel_loss: 0.2776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4213, loss: 0.5180, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||:  90%|######### | 100/111 [01:05<00:07,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9626, LAS: 0.9297, UEM: 0.6625, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2944, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5009, loss: 0.5188, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||:  94%|#########3| 104/111 [01:08<00:04,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9625, LAS: 0.9296, UEM: 0.6571, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4424, partial_loss/deprel_loss: 0.4296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5929, loss: 0.5207, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||:  97%|#########7| 108/111 [01:10<00:01,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9621, LAS: 0.9291, UEM: 0.6547, LEM: 0.4372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9304, partial_loss/deprel_loss: 0.6028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8291, loss: 0.5234, batch_reg_loss: 0.1608, reg_loss: 0.1609 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
+      "2023-04-07 01:38:04,746 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.603  |       N/A\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.930  |       N/A\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.161  |       N/A\n",
+      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - UEM                      |     0.655  |       N/A\n",
+      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
+      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - loss                     |     0.523  |       N/A\n",
+      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - LEM                      |     0.437  |       N/A\n",
+      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - EM                       |     0.886  |       N/A\n",
+      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:38:04,753 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:38:09,561 - INFO - combo.training.trainer - Epoch duration: 0:01:20.506074\n",
+      "2023-04-07 01:38:09,561 - INFO - combo.training.trainer - Estimated training time remaining: 6:19:10\n",
+      "2023-04-07 01:38:09,561 - INFO - allennlp.training.trainer - Epoch 123/399\n",
+      "2023-04-07 01:38:09,561 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:38:09,562 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:38:09,571 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9549, LAS: 0.9194, UEM: 0.5681, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5232, partial_loss/deprel_loss: 0.4827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6516, loss: 0.6007, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:   3%|2         | 3/111 [00:02<01:23,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9627, LAS: 0.9298, UEM: 0.6188, LEM: 0.3916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2662, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5011, loss: 0.5094, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:   6%|6         | 7/111 [00:04<01:16,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9634, LAS: 0.9311, UEM: 0.6393, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1946, partial_loss/deprel_loss: 0.2854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4280, loss: 0.5030, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:   9%|9         | 10/111 [00:07<01:13,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9645, LAS: 0.9316, UEM: 0.6506, LEM: 0.4153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2571, partial_loss/deprel_loss: 0.3332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4788, loss: 0.5021, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:  13%|#2        | 14/111 [00:09<01:08,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9662, LAS: 0.9337, UEM: 0.6572, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2175, partial_loss/deprel_loss: 0.2773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4261, loss: 0.4903, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:  16%|#6        | 18/111 [00:12<01:02,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9576, UAS: 0.9671, LAS: 0.9346, UEM: 0.6837, LEM: 0.4518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0700, partial_loss/deprel_loss: 0.1836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3216, loss: 0.4854, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:  19%|#8        | 21/111 [00:14<01:02,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9682, LAS: 0.9361, UEM: 0.7249, LEM: 0.5181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5037, partial_loss/deprel_loss: 0.4371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6111, loss: 0.4779, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||:  22%|##1       | 24/111 [00:16<01:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9669, LAS: 0.9349, UEM: 0.7034, LEM: 0.4947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3045, partial_loss/deprel_loss: 0.3622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5114, loss: 0.4832, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||:  25%|##5       | 28/111 [00:19<00:56,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9646, LAS: 0.9328, UEM: 0.6862, LEM: 0.4788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.3070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4493, loss: 0.4968, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||:  29%|##8       | 32/111 [00:21<00:52,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9639, LAS: 0.9318, UEM: 0.6867, LEM: 0.4800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2530, partial_loss/deprel_loss: 0.3480, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4897, loss: 0.5024, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||:  32%|###2      | 36/111 [00:24<00:49,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9632, LAS: 0.9314, UEM: 0.6798, LEM: 0.4733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3144, partial_loss/deprel_loss: 0.3244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4831, loss: 0.5084, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||:  36%|###6      | 40/111 [00:26<00:45,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9624, LAS: 0.9305, UEM: 0.6818, LEM: 0.4755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1474, partial_loss/deprel_loss: 0.2510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3910, loss: 0.5125, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||:  40%|###9      | 44/111 [00:29<00:45,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9616, LAS: 0.9297, UEM: 0.6681, LEM: 0.4633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4001, partial_loss/deprel_loss: 0.4014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5619, loss: 0.5174, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||:  42%|####2     | 47/111 [00:31<00:43,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9607, LAS: 0.9289, UEM: 0.6482, LEM: 0.4455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5704, partial_loss/deprel_loss: 0.4718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6522, loss: 0.5269, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||:  47%|####6     | 52/111 [00:34<00:36,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9599, LAS: 0.9278, UEM: 0.6335, LEM: 0.4289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3542, partial_loss/deprel_loss: 0.3405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5039, loss: 0.5339, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||:  51%|#####1    | 57/111 [00:36<00:31,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9248, UAS: 0.9601, LAS: 0.9277, UEM: 0.6278, LEM: 0.4223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3126, partial_loss/deprel_loss: 0.3265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4844, loss: 0.5320, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||:  56%|#####5    | 62/111 [00:38<00:26,  1.86it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9605, LAS: 0.9281, UEM: 0.6417, LEM: 0.4369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1840, partial_loss/deprel_loss: 0.2735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4163, loss: 0.5269, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  59%|#####9    | 66/111 [00:41<00:26,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9610, LAS: 0.9285, UEM: 0.6508, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2534, partial_loss/deprel_loss: 0.3795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5149, loss: 0.5238, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  63%|######3   | 70/111 [00:44<00:26,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9610, LAS: 0.9285, UEM: 0.6460, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6746, partial_loss/deprel_loss: 0.4760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6763, loss: 0.5240, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  67%|######6   | 74/111 [00:47<00:24,  1.50it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9608, LAS: 0.9282, UEM: 0.6378, LEM: 0.4305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2414, partial_loss/deprel_loss: 0.3349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4768, loss: 0.5275, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  70%|#######   | 78/111 [00:49<00:21,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9609, LAS: 0.9282, UEM: 0.6335, LEM: 0.4236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3490, partial_loss/deprel_loss: 0.3569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5159, loss: 0.5275, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  74%|#######3  | 82/111 [00:52<00:18,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9609, LAS: 0.9282, UEM: 0.6348, LEM: 0.4253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1496, partial_loss/deprel_loss: 0.2676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4046, loss: 0.5278, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  77%|#######7  | 86/111 [00:54<00:15,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9612, LAS: 0.9283, UEM: 0.6366, LEM: 0.4246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2001, partial_loss/deprel_loss: 0.2907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4332, loss: 0.5276, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  81%|########1 | 90/111 [01:00<00:17,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9614, LAS: 0.9285, UEM: 0.6366, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1536, partial_loss/deprel_loss: 0.2921, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4250, loss: 0.5268, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  84%|########3 | 93/111 [01:02<00:14,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9613, LAS: 0.9283, UEM: 0.6353, LEM: 0.4225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6619, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.5270, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  87%|########7 | 97/111 [01:05<00:10,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9613, LAS: 0.9283, UEM: 0.6374, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5876, partial_loss/deprel_loss: 0.5230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6964, loss: 0.5270, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  90%|######### | 100/111 [01:07<00:08,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9616, LAS: 0.9286, UEM: 0.6455, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0841, partial_loss/deprel_loss: 0.1611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3063, loss: 0.5250, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  93%|#########2| 103/111 [01:09<00:05,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9621, LAS: 0.9290, UEM: 0.6533, LEM: 0.4414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0820, partial_loss/deprel_loss: 0.2228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3552, loss: 0.5223, batch_reg_loss: 0.1605, reg_loss: 0.1607 ||:  95%|#########5| 106/111 [01:11<00:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9618, LAS: 0.9288, UEM: 0.6516, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3803, partial_loss/deprel_loss: 0.3741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5359, loss: 0.5229, batch_reg_loss: 0.1605, reg_loss: 0.1607 ||:  99%|#########9| 110/111 [01:14<00:00,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9619, LAS: 0.9288, UEM: 0.6520, LEM: 0.4385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2427, partial_loss/deprel_loss: 0.2956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4456, loss: 0.5222, batch_reg_loss: 0.1605, reg_loss: 0.1607 ||: 100%|##########| 111/111 [01:14<00:00,  1.48it/s]\n",
+      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.296  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.243  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.161  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - UEM                      |     0.652  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - loss                     |     0.522  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - LEM                      |     0.439  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - EM                       |     0.935  |       N/A\n",
+      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:39:27,740 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:39:32,872 - INFO - combo.training.trainer - Epoch duration: 0:01:23.310651\n",
+      "2023-04-07 01:39:32,872 - INFO - combo.training.trainer - Estimated training time remaining: 6:17:51\n",
+      "2023-04-07 01:39:32,872 - INFO - allennlp.training.trainer - Epoch 124/399\n",
+      "2023-04-07 01:39:32,872 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:39:32,873 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:39:32,880 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9491, LAS: 0.9161, UEM: 0.6139, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5117, partial_loss/deprel_loss: 0.4023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.5831, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:   3%|2         | 3/111 [00:02<01:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9620, LAS: 0.9297, UEM: 0.7283, LEM: 0.5279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2584, partial_loss/deprel_loss: 0.3415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4854, loss: 0.4947, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:   6%|6         | 7/111 [00:04<01:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9588, LAS: 0.9263, UEM: 0.6802, LEM: 0.4857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2412, partial_loss/deprel_loss: 0.2967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4461, loss: 0.5317, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:   9%|9         | 10/111 [00:06<01:12,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9610, LAS: 0.9292, UEM: 0.6884, LEM: 0.4948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2238, partial_loss/deprel_loss: 0.2941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4406, loss: 0.5143, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:  12%|#1        | 13/111 [00:09<01:10,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9613, LAS: 0.9293, UEM: 0.6973, LEM: 0.5000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1493, partial_loss/deprel_loss: 0.2606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3989, loss: 0.5118, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:  14%|#4        | 16/111 [00:11<01:11,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9637, LAS: 0.9318, UEM: 0.7138, LEM: 0.5118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1904, partial_loss/deprel_loss: 0.2853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.4976, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:  17%|#7        | 19/111 [00:14<01:11,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9640, LAS: 0.9321, UEM: 0.6946, LEM: 0.4842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4298, partial_loss/deprel_loss: 0.4258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5871, loss: 0.4999, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:  21%|##        | 23/111 [00:16<01:04,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9647, LAS: 0.9322, UEM: 0.6975, LEM: 0.4816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2924, partial_loss/deprel_loss: 0.3637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5099, loss: 0.4974, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9642, LAS: 0.9318, UEM: 0.6884, LEM: 0.4722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1649, partial_loss/deprel_loss: 0.2476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3915, loss: 0.5012, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  27%|##7       | 30/111 [00:21<00:55,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8632, UAS: 0.9608, LAS: 0.9285, UEM: 0.6741, LEM: 0.4611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3414, partial_loss/deprel_loss: 0.6991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9880, loss: 0.5256, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  32%|###1      | 35/111 [00:23<00:47,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9610, LAS: 0.9290, UEM: 0.6652, LEM: 0.4505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2631, partial_loss/deprel_loss: 0.2850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4410, loss: 0.5230, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  36%|###6      | 40/111 [00:25<00:40,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9595, LAS: 0.9278, UEM: 0.6427, LEM: 0.4307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7856, partial_loss/deprel_loss: 0.4250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6576, loss: 0.5322, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  41%|####      | 45/111 [00:27<00:35,  1.88it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9603, LAS: 0.9287, UEM: 0.6684, LEM: 0.4677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1457, partial_loss/deprel_loss: 0.3193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4450, loss: 0.5273, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  44%|####4     | 49/111 [00:30<00:34,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9606, LAS: 0.9289, UEM: 0.6664, LEM: 0.4633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1772, partial_loss/deprel_loss: 0.3141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4471, loss: 0.5259, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  48%|####7     | 53/111 [00:33<00:34,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9604, LAS: 0.9284, UEM: 0.6559, LEM: 0.4512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4398, partial_loss/deprel_loss: 0.4302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5925, loss: 0.5301, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  51%|#####1    | 57/111 [00:36<00:35,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9336, UAS: 0.9608, LAS: 0.9289, UEM: 0.6569, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2930, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.5271, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||:  55%|#####4    | 61/111 [00:39<00:33,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9612, LAS: 0.9292, UEM: 0.6546, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3279, partial_loss/deprel_loss: 0.3412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4989, loss: 0.5240, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||:  59%|#####8    | 65/111 [00:42<00:31,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9609, LAS: 0.9288, UEM: 0.6453, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4810, partial_loss/deprel_loss: 0.4411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6094, loss: 0.5271, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||:  62%|######2   | 69/111 [00:44<00:27,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9244, UAS: 0.9615, LAS: 0.9291, UEM: 0.6501, LEM: 0.4342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3155, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.5236, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||:  66%|######5   | 73/111 [00:47<00:25,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9618, LAS: 0.9295, UEM: 0.6574, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1190, partial_loss/deprel_loss: 0.2381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3747, loss: 0.5203, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  69%|######9   | 77/111 [00:50<00:23,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9619, LAS: 0.9296, UEM: 0.6547, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2334, partial_loss/deprel_loss: 0.2876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4371, loss: 0.5202, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  72%|#######2  | 80/111 [00:52<00:21,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9620, LAS: 0.9295, UEM: 0.6601, LEM: 0.4470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0805, partial_loss/deprel_loss: 0.1624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3063, loss: 0.5197, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  75%|#######4  | 83/111 [00:54<00:19,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9623, LAS: 0.9298, UEM: 0.6635, LEM: 0.4503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4317, partial_loss/deprel_loss: 0.4249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5866, loss: 0.5184, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  78%|#######8  | 87/111 [00:57<00:16,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9623, LAS: 0.9299, UEM: 0.6621, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2083, partial_loss/deprel_loss: 0.3284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4647, loss: 0.5186, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  82%|########1 | 91/111 [00:59<00:13,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9624, LAS: 0.9299, UEM: 0.6604, LEM: 0.4445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3465, partial_loss/deprel_loss: 0.3166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4829, loss: 0.5171, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  85%|########4 | 94/111 [01:01<00:11,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9622, LAS: 0.9298, UEM: 0.6586, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1817, partial_loss/deprel_loss: 0.2733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4153, loss: 0.5183, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  88%|########8 | 98/111 [01:04<00:08,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9618, LAS: 0.9294, UEM: 0.6544, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4789, partial_loss/deprel_loss: 0.4105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5844, loss: 0.5203, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  92%|#########1| 102/111 [01:07<00:05,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9622, LAS: 0.9298, UEM: 0.6596, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1177, partial_loss/deprel_loss: 0.2160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3566, loss: 0.5175, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  95%|#########5| 106/111 [01:09<00:03,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9620, LAS: 0.9296, UEM: 0.6558, LEM: 0.4387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2018, partial_loss/deprel_loss: 0.3323, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4664, loss: 0.5189, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  99%|#########9| 110/111 [01:12<00:00,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9619, LAS: 0.9295, UEM: 0.6539, LEM: 0.4372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5260, partial_loss/deprel_loss: 0.4188, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6005, loss: 0.5196, batch_reg_loss: 0.1602, reg_loss: 0.1604 ||: 100%|##########| 111/111 [01:13<00:00,  1.52it/s]\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.419  |       N/A\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.526  |       N/A\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.160  |       N/A\n",
+      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - UEM                      |     0.654  |       N/A\n",
+      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
+      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - loss                     |     0.520  |       N/A\n",
+      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - LEM                      |     0.437  |       N/A\n",
+      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - EM                       |     0.918  |       N/A\n",
+      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:40:49,222 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:40:54,297 - INFO - combo.training.trainer - Epoch duration: 0:01:21.425042\n",
+      "2023-04-07 01:40:54,298 - INFO - combo.training.trainer - Estimated training time remaining: 6:16:27\n",
+      "2023-04-07 01:40:54,298 - INFO - allennlp.training.trainer - Epoch 125/399\n",
+      "2023-04-07 01:40:54,298 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:40:54,299 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:40:54,308 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9613, LAS: 0.9313, UEM: 0.6735, LEM: 0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5213, partial_loss/deprel_loss: 0.4072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5903, loss: 0.4758, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:   3%|2         | 3/111 [00:02<01:25,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9645, LAS: 0.9329, UEM: 0.6774, LEM: 0.4719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3121, partial_loss/deprel_loss: 0.3536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5055, loss: 0.4733, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:   5%|5         | 6/111 [00:04<01:24,  1.24it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9655, LAS: 0.9342, UEM: 0.6826, LEM: 0.4728, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1777, partial_loss/deprel_loss: 0.2511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3966, loss: 0.4649, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:   8%|8         | 9/111 [00:07<01:23,  1.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9142, UAS: 0.9650, LAS: 0.9340, UEM: 0.6952, LEM: 0.5047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5937, partial_loss/deprel_loss: 0.4311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6239, loss: 0.4787, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  11%|#         | 12/111 [00:09<01:19,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9649, LAS: 0.9337, UEM: 0.6848, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2166, partial_loss/deprel_loss: 0.3294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4670, loss: 0.4813, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  14%|#4        | 16/111 [00:11<01:09,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9660, LAS: 0.9351, UEM: 0.7062, LEM: 0.5062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1316, partial_loss/deprel_loss: 0.2023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3484, loss: 0.4730, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  19%|#8        | 21/111 [00:14<00:59,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9748, UAS: 0.9654, LAS: 0.9346, UEM: 0.7213, LEM: 0.5392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0280, partial_loss/deprel_loss: 0.0973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2436, loss: 0.4750, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  23%|##3       | 26/111 [00:17<00:52,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9653, LAS: 0.9340, UEM: 0.7162, LEM: 0.5280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1675, partial_loss/deprel_loss: 0.2431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3882, loss: 0.4790, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  28%|##7       | 31/111 [00:19<00:45,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9649, LAS: 0.9334, UEM: 0.7044, LEM: 0.5135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.2969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4407, loss: 0.4833, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  32%|###1      | 35/111 [00:22<00:47,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9654, LAS: 0.9339, UEM: 0.7023, LEM: 0.5059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3088, partial_loss/deprel_loss: 0.3605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5103, loss: 0.4810, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  35%|###5      | 39/111 [00:25<00:47,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9652, UAS: 0.9658, LAS: 0.9344, UEM: 0.7101, LEM: 0.5151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0582, partial_loss/deprel_loss: 0.1520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2933, loss: 0.4785, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  39%|###8      | 43/111 [00:28<00:47,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9658, LAS: 0.9344, UEM: 0.7116, LEM: 0.5160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1175, partial_loss/deprel_loss: 0.2207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3602, loss: 0.4784, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  41%|####1     | 46/111 [00:30<00:45,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9647, LAS: 0.9330, UEM: 0.7041, LEM: 0.5079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3713, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5028, loss: 0.4888, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  44%|####4     | 49/111 [00:32<00:43,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9644, LAS: 0.9326, UEM: 0.7008, LEM: 0.5038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1494, partial_loss/deprel_loss: 0.2460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3868, loss: 0.4925, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  47%|####6     | 52/111 [00:34<00:42,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9636, LAS: 0.9317, UEM: 0.6896, LEM: 0.4940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5430, partial_loss/deprel_loss: 0.4607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6372, loss: 0.4988, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  50%|####9     | 55/111 [00:37<00:40,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9632, LAS: 0.9313, UEM: 0.6814, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3158, partial_loss/deprel_loss: 0.4089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5504, loss: 0.5032, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  52%|#####2    | 58/111 [00:39<00:38,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9635, LAS: 0.9314, UEM: 0.6849, LEM: 0.4860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0668, partial_loss/deprel_loss: 0.2211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3503, loss: 0.5031, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  55%|#####4    | 61/111 [00:41<00:36,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9631, LAS: 0.9309, UEM: 0.6769, LEM: 0.4773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2835, partial_loss/deprel_loss: 0.3242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4761, loss: 0.5067, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  59%|#####8    | 65/111 [00:43<00:31,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9631, LAS: 0.9309, UEM: 0.6753, LEM: 0.4744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2259, partial_loss/deprel_loss: 0.3241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4645, loss: 0.5067, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  62%|######2   | 69/111 [00:46<00:28,  1.48it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9633, LAS: 0.9310, UEM: 0.6719, LEM: 0.4695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3911, partial_loss/deprel_loss: 0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5563, loss: 0.5057, batch_reg_loss: 0.1601, reg_loss: 0.1601 ||:  66%|######5   | 73/111 [00:48<00:24,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9633, LAS: 0.9308, UEM: 0.6678, LEM: 0.4625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2641, partial_loss/deprel_loss: 0.3907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5254, loss: 0.5079, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  69%|######9   | 77/111 [00:52<00:23,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9636, LAS: 0.9310, UEM: 0.6684, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3835, partial_loss/deprel_loss: 0.4084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5635, loss: 0.5069, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  72%|#######2  | 80/111 [00:54<00:21,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9632, LAS: 0.9306, UEM: 0.6658, LEM: 0.4573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.2731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.5088, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9625, LAS: 0.9298, UEM: 0.6636, LEM: 0.4546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1750, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4520, loss: 0.5155, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9619, LAS: 0.9293, UEM: 0.6578, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4905, partial_loss/deprel_loss: 0.4107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5867, loss: 0.5193, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  81%|########1 | 90/111 [01:01<00:14,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9620, LAS: 0.9293, UEM: 0.6549, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3594, partial_loss/deprel_loss: 0.3532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.5188, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  85%|########4 | 94/111 [01:03<00:11,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9620, LAS: 0.9293, UEM: 0.6545, LEM: 0.4433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1414, partial_loss/deprel_loss: 0.2675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4023, loss: 0.5179, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  88%|########8 | 98/111 [01:06<00:09,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9618, LAS: 0.9291, UEM: 0.6529, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1656, partial_loss/deprel_loss: 0.2876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4232, loss: 0.5198, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  91%|######### | 101/111 [01:08<00:06,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9024, UAS: 0.9616, LAS: 0.9288, UEM: 0.6486, LEM: 0.4364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5981, partial_loss/deprel_loss: 0.4744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6592, loss: 0.5213, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  94%|#########3| 104/111 [01:10<00:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9617, LAS: 0.9288, UEM: 0.6468, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4200, partial_loss/deprel_loss: 0.3656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5364, loss: 0.5212, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  96%|#########6| 107/111 [01:12<00:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9617, LAS: 0.9290, UEM: 0.6453, LEM: 0.4317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4425, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5854, loss: 0.5202, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  99%|#########9| 110/111 [01:15<00:00,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9619, LAS: 0.9291, UEM: 0.6506, LEM: 0.4377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1172, partial_loss/deprel_loss: 0.2338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3705, loss: 0.5188, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
+      "2023-04-07 01:42:13,636 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9276, UAS: 0.9530, LAS: 0.9045, UEM: 0.6088, LEM: 0.3165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3952, partial_loss/deprel_loss: 16.7865, partial_loss/cycle_loss: 0.0000, batch_loss: 13.5082, loss: 20.0456, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.05it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9492, LAS: 0.8996, UEM: 0.5886, LEM: 0.3032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4041, partial_loss/deprel_loss: 25.1117, partial_loss/cycle_loss: 0.0000, batch_loss: 20.1702, loss: 22.7926, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.04it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9418, LAS: 0.8909, UEM: 0.5511, LEM: 0.2718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3135, partial_loss/deprel_loss: 45.1808, partial_loss/cycle_loss: 0.0000, batch_loss: 36.4074, loss: 26.0686, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.08it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9479, LAS: 0.8988, UEM: 0.6540, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7454, partial_loss/deprel_loss: 28.2911, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7820, loss: 24.2716, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:10<00:00,  1.20it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9479, LAS: 0.8988, UEM: 0.6540, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7454, partial_loss/deprel_loss: 28.2911, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7820, loss: 24.2716, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:10<00:00,  1.21it/s]\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.234  |    28.291\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.117  |     0.745\n",
+      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.160  |     0.000\n",
+      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - UEM                      |     0.651  |     0.654\n",
+      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |     0.899\n",
+      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - loss                     |     0.519  |    24.272\n",
+      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - LEM                      |     0.438  |     0.400\n",
+      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |     0.948\n",
+      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - EM                       |     0.947  |     0.888\n",
+      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:42:24,432 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:42:31,104 - INFO - combo.training.trainer - Epoch duration: 0:01:36.805760\n",
+      "2023-04-07 01:42:31,104 - INFO - combo.training.trainer - Estimated training time remaining: 6:15:37\n",
+      "2023-04-07 01:42:31,105 - INFO - allennlp.training.trainer - Epoch 126/399\n",
+      "2023-04-07 01:42:31,105 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:42:31,106 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:42:31,115 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9523, LAS: 0.9153, UEM: 0.4448, LEM: 0.1759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8348, partial_loss/deprel_loss: 0.5327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7531, loss: 0.6257, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||:   3%|2         | 3/111 [00:02<01:16,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9519, LAS: 0.9174, UEM: 0.4296, LEM: 0.1925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3077, partial_loss/deprel_loss: 0.3612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5105, loss: 0.6160, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||:   5%|5         | 6/111 [00:04<01:16,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9510, UAS: 0.9612, LAS: 0.9279, UEM: 0.6479, LEM: 0.4082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1347, partial_loss/deprel_loss: 0.2565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3921, loss: 0.5449, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||:   8%|8         | 9/111 [00:06<01:17,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9316, UAS: 0.9587, LAS: 0.9255, UEM: 0.5725, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3705, partial_loss/deprel_loss: 0.3808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5387, loss: 0.5659, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||:  12%|#1        | 13/111 [00:09<01:11,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9550, LAS: 0.9218, UEM: 0.5284, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3982, partial_loss/deprel_loss: 0.3401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5117, loss: 0.5809, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||:  14%|#4        | 16/111 [00:11<01:08,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9576, LAS: 0.9248, UEM: 0.5812, LEM: 0.3710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1394, partial_loss/deprel_loss: 0.1916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3411, loss: 0.5551, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||:  17%|#7        | 19/111 [00:13<01:07,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9591, LAS: 0.9260, UEM: 0.6086, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5340, partial_loss/deprel_loss: 0.4585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6335, loss: 0.5456, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||:  20%|#9        | 22/111 [00:16<01:04,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9595, LAS: 0.9265, UEM: 0.6058, LEM: 0.3898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2019, partial_loss/deprel_loss: 0.2954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4366, loss: 0.5419, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||:  23%|##2       | 25/111 [00:18<01:02,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9592, LAS: 0.9265, UEM: 0.5935, LEM: 0.3796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2432, partial_loss/deprel_loss: 0.3101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4567, loss: 0.5441, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||:  25%|##5       | 28/111 [00:20<01:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9607, LAS: 0.9278, UEM: 0.6173, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0671, partial_loss/deprel_loss: 0.2273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3552, loss: 0.5343, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  29%|##8       | 32/111 [00:23<00:56,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9744, UAS: 0.9618, LAS: 0.9291, UEM: 0.6616, LEM: 0.4600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0308, partial_loss/deprel_loss: 0.1074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2519, loss: 0.5274, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  32%|###1      | 35/111 [00:25<00:57,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9629, LAS: 0.9300, UEM: 0.6791, LEM: 0.4738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1931, partial_loss/deprel_loss: 0.2645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4101, loss: 0.5188, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  34%|###4      | 38/111 [00:28<00:55,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9631, LAS: 0.9299, UEM: 0.6741, LEM: 0.4640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3212, partial_loss/deprel_loss: 0.3834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5308, loss: 0.5209, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  37%|###6      | 41/111 [00:30<00:53,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9458, UAS: 0.9636, LAS: 0.9306, UEM: 0.6738, LEM: 0.4614, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1649, partial_loss/deprel_loss: 0.2527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3950, loss: 0.5159, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  40%|###9      | 44/111 [00:32<00:49,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9616, LAS: 0.9286, UEM: 0.6619, LEM: 0.4516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1917, partial_loss/deprel_loss: 0.6342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9055, loss: 0.5302, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  42%|####2     | 47/111 [00:34<00:46,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9616, LAS: 0.9287, UEM: 0.6567, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3388, partial_loss/deprel_loss: 0.3337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4945, loss: 0.5289, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  45%|####5     | 50/111 [00:36<00:43,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9619, LAS: 0.9291, UEM: 0.6671, LEM: 0.4614, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4964, partial_loss/deprel_loss: 0.3825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5651, loss: 0.5256, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  48%|####7     | 53/111 [00:38<00:41,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9622, LAS: 0.9292, UEM: 0.6709, LEM: 0.4650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3431, partial_loss/deprel_loss: 0.4040, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5517, loss: 0.5249, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  51%|#####1    | 57/111 [00:41<00:37,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9625, LAS: 0.9295, UEM: 0.6701, LEM: 0.4623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1366, partial_loss/deprel_loss: 0.2424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3811, loss: 0.5231, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  55%|#####4    | 61/111 [00:43<00:32,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9627, LAS: 0.9295, UEM: 0.6651, LEM: 0.4552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2284, partial_loss/deprel_loss: 0.3486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4844, loss: 0.5233, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  59%|#####8    | 65/111 [00:46<00:30,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9307, UAS: 0.9625, LAS: 0.9294, UEM: 0.6603, LEM: 0.4487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.3650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5096, loss: 0.5236, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  62%|######2   | 69/111 [00:49<00:28,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9630, LAS: 0.9299, UEM: 0.6681, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2423, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4638, loss: 0.5196, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  65%|######4   | 72/111 [00:51<00:27,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9628, LAS: 0.9297, UEM: 0.6628, LEM: 0.4496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5273, partial_loss/deprel_loss: 0.4679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6396, loss: 0.5218, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  68%|######7   | 75/111 [00:54<00:27,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9489, UAS: 0.9633, LAS: 0.9302, UEM: 0.6708, LEM: 0.4573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1428, partial_loss/deprel_loss: 0.2046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3520, loss: 0.5175, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  71%|#######1  | 79/111 [00:56<00:23,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9638, LAS: 0.9310, UEM: 0.6793, LEM: 0.4667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0782, partial_loss/deprel_loss: 0.1631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3059, loss: 0.5128, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  75%|#######4  | 83/111 [00:59<00:20,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9636, LAS: 0.9306, UEM: 0.6747, LEM: 0.4620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1512, partial_loss/deprel_loss: 0.2864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4191, loss: 0.5153, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  78%|#######8  | 87/111 [01:02<00:16,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9633, LAS: 0.9305, UEM: 0.6681, LEM: 0.4555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2875, partial_loss/deprel_loss: 0.3476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4953, loss: 0.5166, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  82%|########1 | 91/111 [01:04<00:12,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9631, LAS: 0.9301, UEM: 0.6639, LEM: 0.4504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1869, partial_loss/deprel_loss: 0.2987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4361, loss: 0.5193, batch_reg_loss: 0.1597, reg_loss: 0.1599 ||:  86%|########5 | 95/111 [01:06<00:10,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9625, LAS: 0.9295, UEM: 0.6547, LEM: 0.4417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3615, partial_loss/deprel_loss: 0.4692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6074, loss: 0.5237, batch_reg_loss: 0.1597, reg_loss: 0.1599 ||:  90%|######### | 100/111 [01:09<00:06,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9627, LAS: 0.9297, UEM: 0.6560, LEM: 0.4417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2675, partial_loss/deprel_loss: 0.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4424, loss: 0.5225, batch_reg_loss: 0.1597, reg_loss: 0.1599 ||:  94%|#########3| 104/111 [01:11<00:03,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9630, LAS: 0.9299, UEM: 0.6602, LEM: 0.4442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3212, partial_loss/deprel_loss: 0.3380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4944, loss: 0.5203, batch_reg_loss: 0.1597, reg_loss: 0.1598 ||:  97%|#########7| 108/111 [01:13<00:01,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9630, LAS: 0.9301, UEM: 0.6596, LEM: 0.4437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1864, partial_loss/deprel_loss: 0.2761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4179, loss: 0.5199, batch_reg_loss: 0.1597, reg_loss: 0.1598 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
+      "2023-04-07 01:43:50,185 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.276  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.186  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.160  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - UEM                      |     0.660  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - LAS                      |     0.930  |       N/A\n",
+      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - loss                     |     0.520  |       N/A\n",
+      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - LEM                      |     0.444  |       N/A\n",
+      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
+      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - EM                       |     0.943  |       N/A\n",
+      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:43:50,192 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:44:00,241 - INFO - combo.training.trainer - Epoch duration: 0:01:29.136743\n",
+      "2023-04-07 01:44:00,242 - INFO - combo.training.trainer - Estimated training time remaining: 6:14:29\n",
+      "2023-04-07 01:44:00,242 - INFO - allennlp.training.trainer - Epoch 127/399\n",
+      "2023-04-07 01:44:00,242 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:44:00,243 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:44:00,251 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9666, LAS: 0.9335, UEM: 0.6822, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4385, partial_loss/deprel_loss: 0.3819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5529, loss: 0.4783, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9638, LAS: 0.9309, UEM: 0.6726, LEM: 0.4667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1425, partial_loss/deprel_loss: 0.2496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3879, loss: 0.5058, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:   5%|5         | 6/111 [00:04<01:16,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9619, LAS: 0.9283, UEM: 0.5965, LEM: 0.3874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2555, partial_loss/deprel_loss: 0.3948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.5256, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:   9%|9         | 10/111 [00:06<01:10,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9636, LAS: 0.9300, UEM: 0.6324, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4912, partial_loss/deprel_loss: 0.4681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6324, loss: 0.5159, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:  12%|#1        | 13/111 [00:09<01:11,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9637, LAS: 0.9308, UEM: 0.6668, LEM: 0.4577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6734, partial_loss/deprel_loss: 0.4497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6541, loss: 0.5116, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:  14%|#4        | 16/111 [00:11<01:10,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9639, LAS: 0.9320, UEM: 0.6639, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2104, partial_loss/deprel_loss: 0.2366, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3910, loss: 0.5048, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:  18%|#8        | 20/111 [00:14<01:05,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9655, LAS: 0.9335, UEM: 0.6962, LEM: 0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1528, partial_loss/deprel_loss: 0.2687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4052, loss: 0.4916, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  21%|##        | 23/111 [00:16<01:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9646, LAS: 0.9324, UEM: 0.6944, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3410, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5116, loss: 0.4969, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9652, LAS: 0.9334, UEM: 0.7096, LEM: 0.5095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2559, partial_loss/deprel_loss: 0.3340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.4899, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  26%|##6       | 29/111 [00:20<00:58,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9649, LAS: 0.9331, UEM: 0.7063, LEM: 0.5084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5047, partial_loss/deprel_loss: 0.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5840, loss: 0.4897, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  29%|##8       | 32/111 [00:22<00:55,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9646, LAS: 0.9326, UEM: 0.7006, LEM: 0.5012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4657, partial_loss/deprel_loss: 0.4395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.4926, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  32%|###1      | 35/111 [00:25<00:54,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9638, LAS: 0.9318, UEM: 0.6895, LEM: 0.4905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4964, partial_loss/deprel_loss: 0.4363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6079, loss: 0.4988, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  34%|###4      | 38/111 [00:27<00:52,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9643, LAS: 0.9322, UEM: 0.6923, LEM: 0.4881, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1772, partial_loss/deprel_loss: 0.2341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3823, loss: 0.4965, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||:  37%|###6      | 41/111 [00:29<00:49,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9650, LAS: 0.9329, UEM: 0.6934, LEM: 0.4853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3462, partial_loss/deprel_loss: 0.3507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5094, loss: 0.4947, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||:  41%|####      | 45/111 [00:31<00:45,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9646, LAS: 0.9323, UEM: 0.6840, LEM: 0.4736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3669, partial_loss/deprel_loss: 0.4550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5969, loss: 0.4992, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||:  43%|####3     | 48/111 [00:34<00:44,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9263, UAS: 0.9646, LAS: 0.9325, UEM: 0.6855, LEM: 0.4765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5006, partial_loss/deprel_loss: 0.3715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5569, loss: 0.4968, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||:  46%|####5     | 51/111 [00:36<00:42,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9644, LAS: 0.9320, UEM: 0.6830, LEM: 0.4708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1502, partial_loss/deprel_loss: 0.2345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3772, loss: 0.5002, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||:  50%|####9     | 55/111 [00:38<00:37,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9638, LAS: 0.9313, UEM: 0.6721, LEM: 0.4593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2561, partial_loss/deprel_loss: 0.3670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5043, loss: 0.5036, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  53%|#####3    | 59/111 [00:41<00:34,  1.52it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9633, LAS: 0.9308, UEM: 0.6646, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2075, partial_loss/deprel_loss: 0.2798, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4249, loss: 0.5076, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  57%|#####6    | 63/111 [00:43<00:31,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9636, LAS: 0.9312, UEM: 0.6650, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1355, partial_loss/deprel_loss: 0.2434, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3814, loss: 0.5041, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  60%|######    | 67/111 [00:46<00:28,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9630, LAS: 0.9306, UEM: 0.6607, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2619, partial_loss/deprel_loss: 0.3262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4728, loss: 0.5077, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  64%|######3   | 71/111 [00:48<00:25,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8759, UAS: 0.9626, LAS: 0.9302, UEM: 0.6624, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1859, partial_loss/deprel_loss: 0.6156, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8891, loss: 0.5098, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  68%|######7   | 75/111 [00:51<00:24,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9623, LAS: 0.9297, UEM: 0.6539, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4116, partial_loss/deprel_loss: 0.3849, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5497, loss: 0.5136, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  71%|#######1  | 79/111 [00:53<00:20,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9624, LAS: 0.9298, UEM: 0.6510, LEM: 0.4334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2462, partial_loss/deprel_loss: 0.2908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4414, loss: 0.5126, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  75%|#######4  | 83/111 [00:56<00:18,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9621, LAS: 0.9296, UEM: 0.6472, LEM: 0.4299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1450, partial_loss/deprel_loss: 0.2571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3941, loss: 0.5159, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  78%|#######8  | 87/111 [00:59<00:16,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9611, LAS: 0.9285, UEM: 0.6402, LEM: 0.4247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6970, partial_loss/deprel_loss: 0.5140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7101, loss: 0.5234, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  81%|########1 | 90/111 [01:01<00:14,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9616, LAS: 0.9290, UEM: 0.6462, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2819, partial_loss/deprel_loss: 0.3448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4917, loss: 0.5197, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  85%|########4 | 94/111 [01:04<00:11,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9612, LAS: 0.9286, UEM: 0.6422, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1579, partial_loss/deprel_loss: 0.2391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3823, loss: 0.5220, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  88%|########8 | 98/111 [01:06<00:08,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9614, LAS: 0.9288, UEM: 0.6433, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2286, partial_loss/deprel_loss: 0.3183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4598, loss: 0.5200, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  93%|#########2| 103/111 [01:08<00:04,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9617, LAS: 0.9292, UEM: 0.6548, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0445, partial_loss/deprel_loss: 0.1054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2527, loss: 0.5181, batch_reg_loss: 0.1594, reg_loss: 0.1596 ||:  97%|#########7| 108/111 [01:11<00:01,  1.73it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9619, LAS: 0.9293, UEM: 0.6544, LEM: 0.4415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1877, partial_loss/deprel_loss: 0.2913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4300, loss: 0.5172, batch_reg_loss: 0.1594, reg_loss: 0.1596 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.291  |       N/A\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.188  |       N/A\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.160  |       N/A\n",
+      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - UEM                      |     0.654  |       N/A\n",
+      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
+      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - loss                     |     0.517  |       N/A\n",
+      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - LEM                      |     0.441  |       N/A\n",
+      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - EM                       |     0.946  |       N/A\n",
+      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:45:16,364 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:45:21,256 - INFO - combo.training.trainer - Epoch duration: 0:01:21.013571\n",
+      "2023-04-07 01:45:21,256 - INFO - combo.training.trainer - Estimated training time remaining: 6:13:04\n",
+      "2023-04-07 01:45:21,257 - INFO - allennlp.training.trainer - Epoch 128/399\n",
+      "2023-04-07 01:45:21,257 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:45:21,258 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:45:21,267 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9686, LAS: 0.9401, UEM: 0.8848, LEM: 0.7510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7817, partial_loss/deprel_loss: 0.4661, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6887, loss: 0.4405, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:   3%|2         | 3/111 [00:02<01:29,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9672, LAS: 0.9368, UEM: 0.8125, LEM: 0.6448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1316, partial_loss/deprel_loss: 0.2365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3749, loss: 0.4518, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:   5%|5         | 6/111 [00:04<01:22,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9654, LAS: 0.9340, UEM: 0.7629, LEM: 0.5667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3529, partial_loss/deprel_loss: 0.3521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5117, loss: 0.4713, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:   9%|9         | 10/111 [00:07<01:14,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9637, LAS: 0.9319, UEM: 0.7178, LEM: 0.5154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3760, partial_loss/deprel_loss: 0.3832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5412, loss: 0.4924, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  12%|#1        | 13/111 [00:09<01:10,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9636, LAS: 0.9311, UEM: 0.6900, LEM: 0.4815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.4062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5605, loss: 0.5032, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  14%|#4        | 16/111 [00:11<01:07,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9628, LAS: 0.9302, UEM: 0.6866, LEM: 0.4737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2117, partial_loss/deprel_loss: 0.3412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4747, loss: 0.5149, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  17%|#7        | 19/111 [00:13<01:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9633, LAS: 0.9300, UEM: 0.6896, LEM: 0.4680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3266, partial_loss/deprel_loss: 0.3767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5260, loss: 0.5101, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  20%|#9        | 22/111 [00:15<01:02,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9712, UAS: 0.9636, LAS: 0.9310, UEM: 0.7128, LEM: 0.5145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0364, partial_loss/deprel_loss: 0.1140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2578, loss: 0.5061, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  23%|##3       | 26/111 [00:18<01:01,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9292, UAS: 0.9634, LAS: 0.9309, UEM: 0.6973, LEM: 0.4973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3625, partial_loss/deprel_loss: 0.3910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.5099, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  26%|##6       | 29/111 [00:20<01:00,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9631, LAS: 0.9306, UEM: 0.6848, LEM: 0.4836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6988, partial_loss/deprel_loss: 0.4732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6777, loss: 0.5138, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  29%|##8       | 32/111 [00:22<00:57,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9393, UAS: 0.9634, LAS: 0.9310, UEM: 0.6844, LEM: 0.4811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1891, partial_loss/deprel_loss: 0.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4400, loss: 0.5123, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  32%|###1      | 35/111 [00:24<00:54,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9637, LAS: 0.9314, UEM: 0.6839, LEM: 0.4814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3352, partial_loss/deprel_loss: 0.4113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5554, loss: 0.5115, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  35%|###5      | 39/111 [00:27<00:49,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9635, LAS: 0.9312, UEM: 0.6794, LEM: 0.4762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1725, partial_loss/deprel_loss: 0.3144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4454, loss: 0.5129, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  38%|###7      | 42/111 [00:29<00:49,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9634, LAS: 0.9313, UEM: 0.6717, LEM: 0.4660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2903, partial_loss/deprel_loss: 0.3103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4656, loss: 0.5106, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  41%|####1     | 46/111 [00:32<00:44,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9631, LAS: 0.9309, UEM: 0.6701, LEM: 0.4657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3267, partial_loss/deprel_loss: 0.3545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5083, loss: 0.5113, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  44%|####4     | 49/111 [00:34<00:43,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9639, LAS: 0.9318, UEM: 0.6815, LEM: 0.4748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1246, partial_loss/deprel_loss: 0.2929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4186, loss: 0.5053, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  47%|####6     | 52/111 [00:36<00:41,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9647, LAS: 0.9326, UEM: 0.6911, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2317, partial_loss/deprel_loss: 0.3164, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4588, loss: 0.4997, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  50%|#####     | 56/111 [00:39<00:38,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9643, LAS: 0.9323, UEM: 0.6836, LEM: 0.4717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5482, partial_loss/deprel_loss: 0.4451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6250, loss: 0.5023, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  53%|#####3    | 59/111 [00:41<00:36,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9643, LAS: 0.9320, UEM: 0.6791, LEM: 0.4649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3415, partial_loss/deprel_loss: 0.4532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5901, loss: 0.5038, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  56%|#####5    | 62/111 [00:43<00:34,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9637, LAS: 0.9313, UEM: 0.6766, LEM: 0.4639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1466, partial_loss/deprel_loss: 0.2395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3802, loss: 0.5083, batch_reg_loss: 0.1593, reg_loss: 0.1593 ||:  59%|#####8    | 65/111 [00:45<00:32,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9634, LAS: 0.9310, UEM: 0.6691, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5409, partial_loss/deprel_loss: 0.4361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6163, loss: 0.5110, batch_reg_loss: 0.1593, reg_loss: 0.1593 ||:  61%|######1   | 68/111 [00:47<00:30,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9635, LAS: 0.9313, UEM: 0.6709, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3952, partial_loss/deprel_loss: 0.3686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5331, loss: 0.5081, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  64%|######3   | 71/111 [00:49<00:28,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9629, LAS: 0.9306, UEM: 0.6680, LEM: 0.4550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3841, loss: 0.5118, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  68%|######7   | 75/111 [00:52<00:24,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9399, UAS: 0.9630, LAS: 0.9309, UEM: 0.6637, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4938, loss: 0.5100, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  71%|#######1  | 79/111 [00:54<00:20,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9628, LAS: 0.9307, UEM: 0.6595, LEM: 0.4460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2778, partial_loss/deprel_loss: 0.3128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4650, loss: 0.5112, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  76%|#######5  | 84/111 [00:56<00:15,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9622, LAS: 0.9302, UEM: 0.6550, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4723, partial_loss/deprel_loss: 0.4125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5837, loss: 0.5147, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  79%|#######9  | 88/111 [00:59<00:13,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9624, LAS: 0.9305, UEM: 0.6550, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.2957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4638, loss: 0.5130, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  84%|########3 | 93/111 [01:01<00:09,  1.85it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9624, LAS: 0.9306, UEM: 0.6547, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4645, partial_loss/deprel_loss: 0.3790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5553, loss: 0.5128, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  87%|########7 | 97/111 [01:03<00:07,  1.76it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9625, LAS: 0.9306, UEM: 0.6569, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5331, partial_loss/deprel_loss: 0.3988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5848, loss: 0.5122, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  91%|######### | 101/111 [01:06<00:06,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9622, LAS: 0.9302, UEM: 0.6549, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1454, partial_loss/deprel_loss: 0.2793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4117, loss: 0.5142, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  95%|#########4| 105/111 [01:09<00:03,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9624, LAS: 0.9303, UEM: 0.6560, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1664, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4233, loss: 0.5129, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  98%|#########8| 109/111 [01:12<00:01,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9622, LAS: 0.9302, UEM: 0.6526, LEM: 0.4394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5603, partial_loss/deprel_loss: 0.4172, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6050, loss: 0.5139, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
+      "2023-04-07 01:46:37,762 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.417  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.560  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.159  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - UEM                      |     0.653  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - LAS                      |     0.930  |       N/A\n",
+      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - loss                     |     0.514  |       N/A\n",
+      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - LEM                      |     0.439  |       N/A\n",
+      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
+      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - EM                       |     0.918  |       N/A\n",
+      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:46:37,768 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:46:41,880 - INFO - combo.training.trainer - Epoch duration: 0:01:20.623541\n",
+      "2023-04-07 01:46:41,881 - INFO - combo.training.trainer - Estimated training time remaining: 6:11:38\n",
+      "2023-04-07 01:46:41,881 - INFO - allennlp.training.trainer - Epoch 129/399\n",
+      "2023-04-07 01:46:41,881 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:46:41,882 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:46:41,889 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9571, LAS: 0.9253, UEM: 0.6291, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8287, partial_loss/deprel_loss: 0.4590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6921, loss: 0.5324, batch_reg_loss: 0.1592, reg_loss: 0.1592 ||:   3%|2         | 3/111 [00:02<01:26,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9592, LAS: 0.9265, UEM: 0.5725, LEM: 0.3463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4818, partial_loss/deprel_loss: 0.4078, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5818, loss: 0.5464, batch_reg_loss: 0.1591, reg_loss: 0.1592 ||:   5%|5         | 6/111 [00:04<01:20,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9626, LAS: 0.9302, UEM: 0.5930, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3725, partial_loss/deprel_loss: 0.3704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5299, loss: 0.5211, batch_reg_loss: 0.1591, reg_loss: 0.1592 ||:   8%|8         | 9/111 [00:06<01:15,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9638, LAS: 0.9326, UEM: 0.6199, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4593, partial_loss/deprel_loss: 0.3696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5467, loss: 0.5010, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  11%|#         | 12/111 [00:08<01:11,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9640, LAS: 0.9327, UEM: 0.6444, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1979, partial_loss/deprel_loss: 0.3103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4470, loss: 0.4944, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  14%|#3        | 15/111 [00:10<01:09,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9640, LAS: 0.9322, UEM: 0.6360, LEM: 0.4038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2576, partial_loss/deprel_loss: 0.2993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4501, loss: 0.4992, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  16%|#6        | 18/111 [00:12<01:06,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9635, LAS: 0.9319, UEM: 0.6334, LEM: 0.4055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5344, partial_loss/deprel_loss: 0.4422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.5011, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  19%|#8        | 21/111 [00:15<01:07,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9634, LAS: 0.9314, UEM: 0.6320, LEM: 0.3991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2485, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4827, loss: 0.5029, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  22%|##1       | 24/111 [00:17<01:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9630, LAS: 0.9313, UEM: 0.6391, LEM: 0.4144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1685, partial_loss/deprel_loss: 0.2535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3956, loss: 0.5036, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  25%|##5       | 28/111 [00:19<00:57,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9631, LAS: 0.9318, UEM: 0.6667, LEM: 0.4546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0664, partial_loss/deprel_loss: 0.1603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3006, loss: 0.4998, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  28%|##7       | 31/111 [00:22<00:57,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9630, LAS: 0.9316, UEM: 0.6514, LEM: 0.4349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5565, partial_loss/deprel_loss: 0.4437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6253, loss: 0.5023, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  32%|###1      | 35/111 [00:24<00:53,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9644, LAS: 0.9331, UEM: 0.6810, LEM: 0.4665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1582, partial_loss/deprel_loss: 0.2944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4262, loss: 0.4920, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  34%|###4      | 38/111 [00:27<00:52,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9647, LAS: 0.9334, UEM: 0.6813, LEM: 0.4670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1636, partial_loss/deprel_loss: 0.1904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3441, loss: 0.4904, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  37%|###6      | 41/111 [00:29<00:50,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9655, LAS: 0.9341, UEM: 0.6899, LEM: 0.4729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1564, partial_loss/deprel_loss: 0.2981, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4288, loss: 0.4847, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  40%|###9      | 44/111 [00:31<00:49,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9650, LAS: 0.9336, UEM: 0.6775, LEM: 0.4600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3987, partial_loss/deprel_loss: 0.3938, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.4880, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  43%|####3     | 48/111 [00:34<00:43,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9524, UAS: 0.9650, LAS: 0.9337, UEM: 0.6821, LEM: 0.4667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0927, partial_loss/deprel_loss: 0.2014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3387, loss: 0.4874, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  46%|####5     | 51/111 [00:36<00:43,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9645, LAS: 0.9329, UEM: 0.6861, LEM: 0.4691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1431, partial_loss/deprel_loss: 0.2954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4239, loss: 0.4911, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  49%|####8     | 54/111 [00:38<00:41,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9640, LAS: 0.9326, UEM: 0.6750, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4421, partial_loss/deprel_loss: 0.3833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5540, loss: 0.4949, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  52%|#####2    | 58/111 [00:41<00:36,  1.44it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9638, LAS: 0.9325, UEM: 0.6746, LEM: 0.4601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6530, partial_loss/deprel_loss: 0.3825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5956, loss: 0.4935, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  56%|#####5    | 62/111 [00:43<00:32,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9447, UAS: 0.9637, LAS: 0.9322, UEM: 0.6696, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2146, partial_loss/deprel_loss: 0.2791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4252, loss: 0.4968, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  59%|#####9    | 66/111 [00:45<00:28,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9640, LAS: 0.9326, UEM: 0.6803, LEM: 0.4734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3815, partial_loss/deprel_loss: 0.4428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5895, loss: 0.4949, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  63%|######3   | 70/111 [00:47<00:24,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9629, LAS: 0.9315, UEM: 0.6715, LEM: 0.4660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6440, partial_loss/deprel_loss: 0.4679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6621, loss: 0.5023, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  67%|######6   | 74/111 [00:49<00:21,  1.75it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9632, LAS: 0.9317, UEM: 0.6740, LEM: 0.4683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2068, partial_loss/deprel_loss: 0.2518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4017, loss: 0.5003, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  71%|#######1  | 79/111 [00:52<00:17,  1.86it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9632, LAS: 0.9317, UEM: 0.6723, LEM: 0.4657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3288, partial_loss/deprel_loss: 0.3709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5215, loss: 0.5008, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  75%|#######4  | 83/111 [00:54<00:15,  1.82it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9627, LAS: 0.9313, UEM: 0.6709, LEM: 0.4648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3954, partial_loss/deprel_loss: 0.3580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5244, loss: 0.5027, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  78%|#######8  | 87/111 [00:57<00:14,  1.65it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9632, LAS: 0.9318, UEM: 0.6740, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1702, partial_loss/deprel_loss: 0.2829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.5005, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  82%|########1 | 91/111 [01:00<00:12,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9632, LAS: 0.9318, UEM: 0.6711, LEM: 0.4630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.3492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5063, loss: 0.5009, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  86%|########5 | 95/111 [01:03<00:10,  1.53it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9633, LAS: 0.9318, UEM: 0.6691, LEM: 0.4596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.3264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4655, loss: 0.5007, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  89%|########9 | 99/111 [01:05<00:07,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8938, UAS: 0.9627, LAS: 0.9312, UEM: 0.6639, LEM: 0.4552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8737, partial_loss/deprel_loss: 0.5311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7585, loss: 0.5051, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  93%|#########2| 103/111 [01:08<00:05,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9308, UAS: 0.9626, LAS: 0.9309, UEM: 0.6591, LEM: 0.4496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2589, partial_loss/deprel_loss: 0.3584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4974, loss: 0.5073, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  96%|#########6| 107/111 [01:11<00:02,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9626, LAS: 0.9310, UEM: 0.6551, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2786, partial_loss/deprel_loss: 0.3110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4634, loss: 0.5071, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 100%|##########| 111/111 [01:13<00:00,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9626, LAS: 0.9310, UEM: 0.6551, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2786, partial_loss/deprel_loss: 0.3110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4634, loss: 0.5071, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
+      "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.311  |       N/A\n",
+      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.279  |       N/A\n",
+      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.159  |       N/A\n",
+      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - UEM                      |     0.655  |       N/A\n",
+      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |       N/A\n",
+      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - loss                     |     0.507  |       N/A\n",
+      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - LEM                      |     0.445  |       N/A\n",
+      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
+      "2023-04-07 01:47:59,075 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:47:59,075 - INFO - combo.training.tensorboard_writer - EM                       |     0.942  |       N/A\n",
+      "2023-04-07 01:47:59,075 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2023-04-07 01:47:59,081 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:48:06,063 - INFO - combo.training.trainer - Epoch duration: 0:01:24.181700\n",
+      "2023-04-07 01:48:06,063 - INFO - combo.training.trainer - Estimated training time remaining: 6:10:20\n",
+      "2023-04-07 01:48:06,063 - INFO - allennlp.training.trainer - Epoch 130/399\n",
+      "2023-04-07 01:48:06,063 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:48:06,064 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:48:06,073 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9644, LAS: 0.9321, UEM: 0.6007, LEM: 0.3618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2983, partial_loss/deprel_loss: 0.2848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4464, loss: 0.5070, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||:   4%|3         | 4/111 [00:02<01:06,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9630, LAS: 0.9319, UEM: 0.5347, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2984, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5272, loss: 0.5090, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||:   7%|7         | 8/111 [00:05<01:05,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9602, LAS: 0.9286, UEM: 0.5392, LEM: 0.3094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5463, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6124, loss: 0.5236, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||:  11%|#         | 12/111 [00:07<01:00,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9631, LAS: 0.9321, UEM: 0.5913, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1982, partial_loss/deprel_loss: 0.2946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4342, loss: 0.5061, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||:  14%|#3        | 15/111 [00:09<01:00,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9651, LAS: 0.9341, UEM: 0.6675, LEM: 0.4530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1868, partial_loss/deprel_loss: 0.2916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4295, loss: 0.4874, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||:  16%|#6        | 18/111 [00:11<01:02,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9496, UAS: 0.9650, LAS: 0.9341, UEM: 0.6555, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1861, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4318, loss: 0.4924, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||:  19%|#8        | 21/111 [00:13<01:01,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9653, LAS: 0.9344, UEM: 0.6473, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3484, partial_loss/deprel_loss: 0.3837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5355, loss: 0.4921, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||:  22%|##1       | 24/111 [00:15<00:59,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9638, LAS: 0.9329, UEM: 0.6244, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5195, partial_loss/deprel_loss: 0.4305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6071, loss: 0.5015, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||:  25%|##5       | 28/111 [00:18<00:55,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9630, LAS: 0.9317, UEM: 0.6259, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9956, partial_loss/deprel_loss: 0.5592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8053, loss: 0.5075, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||:  29%|##8       | 32/111 [00:21<00:52,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9632, LAS: 0.9318, UEM: 0.6266, LEM: 0.4038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4981, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6027, loss: 0.5074, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:  32%|###2      | 36/111 [00:23<00:48,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9640, LAS: 0.9322, UEM: 0.6423, LEM: 0.4150, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5620, partial_loss/deprel_loss: 0.4993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6706, loss: 0.5044, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:  36%|###6      | 40/111 [00:26<00:46,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9647, LAS: 0.9332, UEM: 0.6779, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1671, partial_loss/deprel_loss: 0.2614, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4013, loss: 0.4988, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:  39%|###8      | 43/111 [00:29<00:50,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9657, LAS: 0.9343, UEM: 0.7038, LEM: 0.4956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1492, partial_loss/deprel_loss: 0.2090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3558, loss: 0.4886, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:  42%|####2     | 47/111 [00:31<00:44,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9643, LAS: 0.9328, UEM: 0.6897, LEM: 0.4799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6428, partial_loss/deprel_loss: 0.4771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6690, loss: 0.4994, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:  47%|####6     | 52/111 [00:34<00:37,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9641, LAS: 0.9324, UEM: 0.6784, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4256, partial_loss/deprel_loss: 0.3724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5417, loss: 0.5004, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  51%|#####1    | 57/111 [00:36<00:31,  1.71it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9646, LAS: 0.9329, UEM: 0.6881, LEM: 0.4768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1164, partial_loss/deprel_loss: 0.2322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3677, loss: 0.4959, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  55%|#####4    | 61/111 [00:38<00:29,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9646, LAS: 0.9331, UEM: 0.6927, LEM: 0.4829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7745, partial_loss/deprel_loss: 0.3842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6210, loss: 0.4928, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  59%|#####8    | 65/111 [00:41<00:28,  1.60it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9164, UAS: 0.9634, LAS: 0.9317, UEM: 0.6818, LEM: 0.4728, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6007, partial_loss/deprel_loss: 0.4266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6201, loss: 0.5024, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  62%|######2   | 69/111 [00:44<00:28,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9624, LAS: 0.9309, UEM: 0.6704, LEM: 0.4636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7995, partial_loss/deprel_loss: 0.4756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6991, loss: 0.5085, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  66%|######5   | 73/111 [00:47<00:26,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9618, LAS: 0.9302, UEM: 0.6615, LEM: 0.4558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5721, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6239, loss: 0.5133, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  68%|######8   | 76/111 [00:49<00:24,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9620, LAS: 0.9302, UEM: 0.6593, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1839, partial_loss/deprel_loss: 0.2956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4320, loss: 0.5124, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  71%|#######1  | 79/111 [00:51<00:22,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9622, LAS: 0.9302, UEM: 0.6649, LEM: 0.4552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0736, partial_loss/deprel_loss: 0.2425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3674, loss: 0.5128, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  74%|#######3  | 82/111 [00:54<00:21,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9530, UAS: 0.9626, LAS: 0.9307, UEM: 0.6698, LEM: 0.4592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1218, partial_loss/deprel_loss: 0.2427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3772, loss: 0.5096, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  77%|#######6  | 85/111 [00:56<00:19,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9628, LAS: 0.9308, UEM: 0.6682, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3937, partial_loss/deprel_loss: 0.3968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5549, loss: 0.5091, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  79%|#######9  | 88/111 [00:58<00:17,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9630, LAS: 0.9310, UEM: 0.6678, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2192, partial_loss/deprel_loss: 0.3421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4762, loss: 0.5076, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  82%|########1 | 91/111 [01:00<00:14,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9628, LAS: 0.9308, UEM: 0.6676, LEM: 0.4532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0291, partial_loss/deprel_loss: 0.5194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.5087, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  85%|########4 | 94/111 [01:03<00:12,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9626, LAS: 0.9306, UEM: 0.6626, LEM: 0.4482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5218, partial_loss/deprel_loss: 0.4520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6246, loss: 0.5101, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  87%|########7 | 97/111 [01:05<00:10,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9626, LAS: 0.9306, UEM: 0.6591, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3161, partial_loss/deprel_loss: 0.3380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4923, loss: 0.5099, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  91%|######### | 101/111 [01:08<00:07,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9627, LAS: 0.9307, UEM: 0.6601, LEM: 0.4457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7448, partial_loss/deprel_loss: 0.5054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7119, loss: 0.5095, batch_reg_loss: 0.1586, reg_loss: 0.1588 ||:  95%|#########4| 105/111 [01:10<00:04,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9627, LAS: 0.9308, UEM: 0.6589, LEM: 0.4450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1161, partial_loss/deprel_loss: 0.2363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3709, loss: 0.5088, batch_reg_loss: 0.1586, reg_loss: 0.1588 ||:  98%|#########8| 109/111 [01:13<00:01,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9627, LAS: 0.9307, UEM: 0.6574, LEM: 0.4431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6138, partial_loss/deprel_loss: 0.4042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.5099, batch_reg_loss: 0.1586, reg_loss: 0.1588 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
+      "2023-04-07 01:49:23,847 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9558, LAS: 0.9078, UEM: 0.7180, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4751, partial_loss/deprel_loss: 23.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 18.8436, loss: 24.3775, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.14it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9387, LAS: 0.8868, UEM: 0.5723, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6799, partial_loss/deprel_loss: 53.1680, partial_loss/cycle_loss: 0.0000, batch_loss: 42.8704, loss: 28.7997, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9395, LAS: 0.8866, UEM: 0.5282, LEM: 0.2489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7739, partial_loss/deprel_loss: 28.3741, partial_loss/cycle_loss: 0.0000, batch_loss: 22.8540, loss: 27.7545, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.07it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9457, LAS: 0.8958, UEM: 0.6517, LEM: 0.4020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1904, partial_loss/deprel_loss: 17.1259, partial_loss/cycle_loss: 0.0000, batch_loss: 13.7388, loss: 25.1794, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9482, LAS: 0.8982, UEM: 0.6599, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5900, partial_loss/deprel_loss: 23.0872, partial_loss/cycle_loss: 0.0000, batch_loss: 18.5878, loss: 24.2782, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.00s/it]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9482, LAS: 0.8982, UEM: 0.6599, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5900, partial_loss/deprel_loss: 23.0872, partial_loss/cycle_loss: 0.0000, batch_loss: 18.5878, loss: 24.2782, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.01it/s]\n",
+      "2023-04-07 01:49:36,765 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:49:36,765 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.404  |    23.087\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.614  |     0.590\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.159  |     0.000\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - UEM                      |     0.657  |     0.660\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |     0.898\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - loss                     |     0.510  |    24.278\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - LEM                      |     0.443  |     0.394\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |     0.948\n",
+      "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - EM                       |     0.916  |     0.901\n",
+      "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:49:36,772 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:49:41,759 - INFO - combo.training.trainer - Epoch duration: 0:01:35.695957\n",
+      "2023-04-07 01:49:41,760 - INFO - combo.training.trainer - Estimated training time remaining: 6:09:25\n",
+      "2023-04-07 01:49:41,760 - INFO - allennlp.training.trainer - Epoch 131/399\n",
+      "2023-04-07 01:49:41,760 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:49:41,761 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:49:41,771 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9658, LAS: 0.9335, UEM: 0.6562, LEM: 0.4297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2158, partial_loss/deprel_loss: 0.3432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4763, loss: 0.4845, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:   3%|2         | 3/111 [00:02<01:25,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9690, LAS: 0.9351, UEM: 0.6834, LEM: 0.4218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2940, partial_loss/deprel_loss: 0.3080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4639, loss: 0.4758, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:   5%|5         | 6/111 [00:04<01:19,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9650, LAS: 0.9318, UEM: 0.6375, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1942, partial_loss/deprel_loss: 0.2715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4146, loss: 0.5000, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:   9%|9         | 10/111 [00:06<01:09,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9639, LAS: 0.9309, UEM: 0.6198, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4991, partial_loss/deprel_loss: 0.4957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6550, loss: 0.5093, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  14%|#3        | 15/111 [00:09<01:00,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9632, LAS: 0.9305, UEM: 0.6157, LEM: 0.3840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7437, partial_loss/deprel_loss: 0.4854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6957, loss: 0.5132, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  17%|#7        | 19/111 [00:11<00:58,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9644, LAS: 0.9318, UEM: 0.6112, LEM: 0.3696, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3087, partial_loss/deprel_loss: 0.3383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4910, loss: 0.5065, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  21%|##        | 23/111 [00:13<00:52,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9700, UAS: 0.9657, LAS: 0.9339, UEM: 0.6792, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0435, partial_loss/deprel_loss: 0.1104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2556, loss: 0.4905, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  24%|##4       | 27/111 [00:16<00:52,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9643, LAS: 0.9328, UEM: 0.6564, LEM: 0.4454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3674, partial_loss/deprel_loss: 0.3604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.4984, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  28%|##7       | 31/111 [00:18<00:49,  1.63it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9642, LAS: 0.9326, UEM: 0.6407, LEM: 0.4252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3813, partial_loss/deprel_loss: 0.3253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4951, loss: 0.4981, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  32%|###2      | 36/111 [00:20<00:42,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9645, LAS: 0.9329, UEM: 0.6449, LEM: 0.4271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4363, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5318, loss: 0.4958, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  37%|###6      | 41/111 [00:23<00:37,  1.85it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9644, LAS: 0.9328, UEM: 0.6491, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4255, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5944, loss: 0.4963, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  41%|####      | 45/111 [00:26<00:38,  1.70it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9642, LAS: 0.9327, UEM: 0.6549, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3966, partial_loss/deprel_loss: 0.3687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5328, loss: 0.4974, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  44%|####4     | 49/111 [00:28<00:37,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9646, LAS: 0.9330, UEM: 0.6640, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2790, partial_loss/deprel_loss: 0.3283, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.4947, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  48%|####7     | 53/111 [00:31<00:37,  1.57it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9653, LAS: 0.9338, UEM: 0.6784, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2823, partial_loss/deprel_loss: 0.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4846, loss: 0.4883, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  51%|#####1    | 57/111 [00:34<00:37,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9657, LAS: 0.9338, UEM: 0.6797, LEM: 0.4635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1760, partial_loss/deprel_loss: 0.2770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4153, loss: 0.4867, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  55%|#####4    | 61/111 [00:37<00:34,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9659, LAS: 0.9341, UEM: 0.6800, LEM: 0.4620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.3302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4663, loss: 0.4860, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  58%|#####7    | 64/111 [00:39<00:32,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9655, LAS: 0.9335, UEM: 0.6778, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1973, partial_loss/deprel_loss: 0.2701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4140, loss: 0.4904, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  61%|######1   | 68/111 [00:42<00:29,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9646, LAS: 0.9325, UEM: 0.6730, LEM: 0.4548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6611, partial_loss/deprel_loss: 0.4525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6527, loss: 0.4967, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  64%|######3   | 71/111 [00:44<00:27,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9640, LAS: 0.9318, UEM: 0.6679, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4213, partial_loss/deprel_loss: 0.4116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5720, loss: 0.5014, batch_reg_loss: 0.1585, reg_loss: 0.1585 ||:  68%|######7   | 75/111 [00:46<00:24,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9636, LAS: 0.9316, UEM: 0.6655, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5326, partial_loss/deprel_loss: 0.4338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6120, loss: 0.5018, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  71%|#######1  | 79/111 [00:49<00:21,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9635, LAS: 0.9314, UEM: 0.6593, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4088, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.5036, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  74%|#######3  | 82/111 [00:51<00:19,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9638, LAS: 0.9319, UEM: 0.6595, LEM: 0.4433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1496, partial_loss/deprel_loss: 0.2449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3843, loss: 0.5006, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  77%|#######7  | 86/111 [00:54<00:16,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9638, LAS: 0.9319, UEM: 0.6648, LEM: 0.4531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6573, partial_loss/deprel_loss: 0.5130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7003, loss: 0.5010, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  80%|########  | 89/111 [00:56<00:15,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9636, LAS: 0.9317, UEM: 0.6590, LEM: 0.4469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4891, partial_loss/deprel_loss: 0.4768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6377, loss: 0.5029, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  84%|########3 | 93/111 [00:59<00:11,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9635, LAS: 0.9316, UEM: 0.6583, LEM: 0.4467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1251, partial_loss/deprel_loss: 0.2280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3658, loss: 0.5027, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  87%|########7 | 97/111 [01:02<00:09,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9636, LAS: 0.9318, UEM: 0.6572, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1973, partial_loss/deprel_loss: 0.2348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3857, loss: 0.5018, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  90%|######### | 100/111 [01:04<00:07,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9639, LAS: 0.9319, UEM: 0.6622, LEM: 0.4478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2035, partial_loss/deprel_loss: 0.3206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4556, loss: 0.5003, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  93%|#########2| 103/111 [01:06<00:05,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9637, LAS: 0.9318, UEM: 0.6594, LEM: 0.4448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7736, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6612, loss: 0.5017, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  95%|#########5| 106/111 [01:08<00:03,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9633, LAS: 0.9314, UEM: 0.6576, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4196, partial_loss/deprel_loss: 0.3443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5178, loss: 0.5043, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  98%|#########8| 109/111 [01:10<00:01,  1.41it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9633, LAS: 0.9314, UEM: 0.6589, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5801, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6111, loss: 0.5043, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
+      "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.421  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.580  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.159  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - UEM                      |     0.659  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - loss                     |     0.504  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - LEM                      |     0.444  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
+      "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - EM                       |     0.916  |       N/A\n",
+      "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:50:57,372 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:51:04,337 - INFO - combo.training.trainer - Epoch duration: 0:01:22.576860\n",
+      "2023-04-07 01:51:04,337 - INFO - combo.training.trainer - Estimated training time remaining: 6:08:03\n",
+      "2023-04-07 01:51:04,338 - INFO - allennlp.training.trainer - Epoch 132/399\n",
+      "2023-04-07 01:51:04,338 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:51:04,339 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:51:04,348 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9355, LAS: 0.9035, UEM: 0.2982, LEM: 0.1404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4192, partial_loss/deprel_loss: 0.4010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5630, loss: 0.6882, batch_reg_loss: 0.1584, reg_loss: 0.1584 ||:   3%|2         | 3/111 [00:02<01:25,  1.26it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9578, UAS: 0.9504, LAS: 0.9180, UEM: 0.5783, LEM: 0.3771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1050, partial_loss/deprel_loss: 0.2255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3598, loss: 0.5970, batch_reg_loss: 0.1584, reg_loss: 0.1584 ||:   6%|6         | 7/111 [00:04<01:14,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9573, LAS: 0.9259, UEM: 0.6287, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5310, partial_loss/deprel_loss: 0.3926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5786, loss: 0.5515, batch_reg_loss: 0.1584, reg_loss: 0.1584 ||:  11%|#         | 12/111 [00:06<01:04,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9336, UAS: 0.9604, LAS: 0.9291, UEM: 0.6289, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4788, loss: 0.5247, batch_reg_loss: 0.1583, reg_loss: 0.1584 ||:  15%|#5        | 17/111 [00:09<00:55,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9363, UAS: 0.9596, LAS: 0.9288, UEM: 0.5911, LEM: 0.3805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2431, partial_loss/deprel_loss: 0.2964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4441, loss: 0.5271, batch_reg_loss: 0.1583, reg_loss: 0.1584 ||:  20%|#9        | 22/111 [00:11<00:49,  1.80it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9608, LAS: 0.9298, UEM: 0.6044, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1252, partial_loss/deprel_loss: 0.2280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3657, loss: 0.5187, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  23%|##3       | 26/111 [00:14<00:49,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9616, LAS: 0.9301, UEM: 0.6135, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4241, partial_loss/deprel_loss: 0.3883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.5136, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  27%|##7       | 30/111 [00:16<00:48,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9613, LAS: 0.9295, UEM: 0.5998, LEM: 0.3801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2229, partial_loss/deprel_loss: 0.3298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4667, loss: 0.5181, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  31%|###       | 34/111 [00:19<00:46,  1.67it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9604, UAS: 0.9620, LAS: 0.9306, UEM: 0.6366, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0532, partial_loss/deprel_loss: 0.1433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2835, loss: 0.5104, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  34%|###4      | 38/111 [00:22<00:48,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9631, LAS: 0.9317, UEM: 0.6435, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.3114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4472, loss: 0.5039, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  38%|###7      | 42/111 [00:24<00:43,  1.57it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9622, LAS: 0.9310, UEM: 0.6257, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6065, partial_loss/deprel_loss: 0.4111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6085, loss: 0.5105, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  41%|####1     | 46/111 [00:27<00:41,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9623, LAS: 0.9310, UEM: 0.6233, LEM: 0.4077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4085, partial_loss/deprel_loss: 0.4134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5707, loss: 0.5106, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  45%|####5     | 50/111 [00:30<00:41,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9628, LAS: 0.9316, UEM: 0.6238, LEM: 0.4058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2636, partial_loss/deprel_loss: 0.3504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4913, loss: 0.5083, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  49%|####8     | 54/111 [00:33<00:39,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9632, LAS: 0.9320, UEM: 0.6408, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3688, partial_loss/deprel_loss: 0.3437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5070, loss: 0.5037, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  51%|#####1    | 57/111 [00:35<00:39,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9636, LAS: 0.9324, UEM: 0.6484, LEM: 0.4327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1830, partial_loss/deprel_loss: 0.2714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4120, loss: 0.5000, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  54%|#####4    | 60/111 [00:37<00:36,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9638, LAS: 0.9326, UEM: 0.6474, LEM: 0.4314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2889, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4825, loss: 0.4986, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  57%|#####6    | 63/111 [00:39<00:34,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9625, LAS: 0.9312, UEM: 0.6366, LEM: 0.4223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9148, partial_loss/deprel_loss: 0.4920, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7348, loss: 0.5080, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  60%|######    | 67/111 [00:42<00:30,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9625, LAS: 0.9313, UEM: 0.6407, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3029, partial_loss/deprel_loss: 0.3052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4629, loss: 0.5070, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  63%|######3   | 70/111 [00:44<00:28,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9623, LAS: 0.9311, UEM: 0.6390, LEM: 0.4277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6995, partial_loss/deprel_loss: 0.4300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6421, loss: 0.5082, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  66%|######5   | 73/111 [00:46<00:26,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9509, UAS: 0.9628, LAS: 0.9315, UEM: 0.6497, LEM: 0.4384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0792, partial_loss/deprel_loss: 0.2490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3733, loss: 0.5059, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  68%|######8   | 76/111 [00:49<00:26,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9437, UAS: 0.9626, LAS: 0.9311, UEM: 0.6497, LEM: 0.4388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1317, partial_loss/deprel_loss: 0.2263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3656, loss: 0.5085, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  71%|#######1  | 79/111 [00:51<00:23,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9628, LAS: 0.9313, UEM: 0.6545, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4289, partial_loss/deprel_loss: 0.4707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6206, loss: 0.5078, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  75%|#######4  | 83/111 [00:53<00:19,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9324, UAS: 0.9630, LAS: 0.9315, UEM: 0.6547, LEM: 0.4427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2771, partial_loss/deprel_loss: 0.3637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5046, loss: 0.5069, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  77%|#######7  | 86/111 [00:55<00:17,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9633, LAS: 0.9316, UEM: 0.6556, LEM: 0.4405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2261, partial_loss/deprel_loss: 0.3324, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4693, loss: 0.5058, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  80%|########  | 89/111 [00:57<00:15,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9631, LAS: 0.9313, UEM: 0.6521, LEM: 0.4364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2621, partial_loss/deprel_loss: 0.2951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4466, loss: 0.5071, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  83%|########2 | 92/111 [01:00<00:13,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9633, LAS: 0.9317, UEM: 0.6672, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0490, partial_loss/deprel_loss: 0.1049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2518, loss: 0.5055, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  86%|########5 | 95/111 [01:03<00:12,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9637, LAS: 0.9318, UEM: 0.6667, LEM: 0.4554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3139, partial_loss/deprel_loss: 0.3837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5279, loss: 0.5045, batch_reg_loss: 0.1581, reg_loss: 0.1583 ||:  89%|########9 | 99/111 [01:05<00:08,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9638, LAS: 0.9319, UEM: 0.6678, LEM: 0.4559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1525, partial_loss/deprel_loss: 0.2578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3949, loss: 0.5033, batch_reg_loss: 0.1581, reg_loss: 0.1583 ||:  92%|#########1| 102/111 [01:07<00:06,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9633, LAS: 0.9314, UEM: 0.6613, LEM: 0.4506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5248, partial_loss/deprel_loss: 0.4121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5928, loss: 0.5068, batch_reg_loss: 0.1581, reg_loss: 0.1583 ||:  95%|#########4| 105/111 [01:09<00:04,  1.36it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9629, LAS: 0.9311, UEM: 0.6577, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4233, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5947, loss: 0.5092, batch_reg_loss: 0.1581, reg_loss: 0.1582 ||:  97%|#########7| 108/111 [01:12<00:02,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9632, LAS: 0.9313, UEM: 0.6598, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1641, partial_loss/deprel_loss: 0.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4201, loss: 0.5077, batch_reg_loss: 0.1581, reg_loss: 0.1582 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "2023-04-07 01:52:21,453 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.287  |       N/A\n",
+      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.164  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.158  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - UEM                      |     0.660  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - loss                     |     0.508  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - LEM                      |     0.447  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - EM                       |     0.944  |       N/A\n",
+      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:52:21,460 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:52:29,124 - INFO - combo.training.trainer - Epoch duration: 0:01:24.786423\n",
+      "2023-04-07 01:52:29,125 - INFO - combo.training.trainer - Estimated training time remaining: 6:06:46\n",
+      "2023-04-07 01:52:29,125 - INFO - allennlp.training.trainer - Epoch 133/399\n",
+      "2023-04-07 01:52:29,125 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:52:29,126 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:52:29,137 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9731, LAS: 0.9427, UEM: 0.7832, LEM: 0.5870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3008, partial_loss/deprel_loss: 0.2936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4532, loss: 0.4103, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:   5%|4         | 5/111 [00:02<00:52,  2.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9658, LAS: 0.9356, UEM: 0.7113, LEM: 0.5108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3312, partial_loss/deprel_loss: 0.3483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5030, loss: 0.4581, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:   7%|7         | 8/111 [00:04<00:59,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9656, LAS: 0.9347, UEM: 0.7061, LEM: 0.4976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3322, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4928, loss: 0.4600, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:  10%|9         | 11/111 [00:06<01:02,  1.61it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9632, LAS: 0.9318, UEM: 0.6725, LEM: 0.4664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7018, partial_loss/deprel_loss: 0.4381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6489, loss: 0.4809, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:  13%|#2        | 14/111 [00:08<01:02,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9634, LAS: 0.9313, UEM: 0.6568, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1925, partial_loss/deprel_loss: 0.3132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4472, loss: 0.4887, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:  15%|#5        | 17/111 [00:11<01:02,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9628, LAS: 0.9303, UEM: 0.6486, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2312, partial_loss/deprel_loss: 0.2814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4294, loss: 0.4948, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:  18%|#8        | 20/111 [00:13<01:03,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9638, LAS: 0.9312, UEM: 0.6779, LEM: 0.4617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7755, partial_loss/deprel_loss: 0.4929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7074, loss: 0.4923, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:  21%|##        | 23/111 [00:15<01:01,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9616, UAS: 0.9652, LAS: 0.9330, UEM: 0.7083, LEM: 0.4995, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0606, partial_loss/deprel_loss: 0.1413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2832, loss: 0.4807, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  23%|##3       | 26/111 [00:18<01:02,  1.36it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9646, LAS: 0.9325, UEM: 0.7066, LEM: 0.5026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4830, partial_loss/deprel_loss: 0.3893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5661, loss: 0.4855, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  26%|##6       | 29/111 [00:20<00:59,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9635, LAS: 0.9313, UEM: 0.6873, LEM: 0.4828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8328, partial_loss/deprel_loss: 0.5691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7799, loss: 0.4968, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  30%|##9       | 33/111 [00:22<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9639, LAS: 0.9316, UEM: 0.6871, LEM: 0.4818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.3547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4994, loss: 0.4923, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  32%|###2      | 36/111 [00:24<00:53,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9619, LAS: 0.9301, UEM: 0.6684, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6564, partial_loss/deprel_loss: 0.4076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6154, loss: 0.5014, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  36%|###6      | 40/111 [00:27<00:48,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9617, LAS: 0.9298, UEM: 0.6542, LEM: 0.4504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5085, partial_loss/deprel_loss: 0.4750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6397, loss: 0.5079, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  40%|###9      | 44/111 [00:29<00:44,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9423, UAS: 0.9625, LAS: 0.9306, UEM: 0.6561, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.2727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4192, loss: 0.5018, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  43%|####3     | 48/111 [00:32<00:40,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9626, LAS: 0.9304, UEM: 0.6582, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1578, partial_loss/deprel_loss: 0.2982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4281, loss: 0.5035, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  47%|####6     | 52/111 [00:35<00:39,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9627, LAS: 0.9306, UEM: 0.6538, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2265, partial_loss/deprel_loss: 0.3118, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4527, loss: 0.5034, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9630, LAS: 0.9310, UEM: 0.6533, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3521, partial_loss/deprel_loss: 0.3434, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.5006, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  53%|#####3    | 59/111 [00:40<00:35,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9634, LAS: 0.9315, UEM: 0.6593, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3861, partial_loss/deprel_loss: 0.3899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5471, loss: 0.4973, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  56%|#####5    | 62/111 [00:42<00:34,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9632, LAS: 0.9313, UEM: 0.6543, LEM: 0.4386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4943, partial_loss/deprel_loss: 0.4377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6070, loss: 0.4994, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  59%|#####8    | 65/111 [00:44<00:33,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9637, LAS: 0.9317, UEM: 0.6609, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2084, partial_loss/deprel_loss: 0.2780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4221, loss: 0.4958, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  61%|######1   | 68/111 [00:47<00:32,  1.31it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9776, UAS: 0.9645, LAS: 0.9327, UEM: 0.6818, LEM: 0.4724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0263, partial_loss/deprel_loss: 0.0802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2273, loss: 0.4900, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  65%|######4   | 72/111 [00:50<00:29,  1.33it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9231, UAS: 0.9648, LAS: 0.9329, UEM: 0.6870, LEM: 0.4766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3513, partial_loss/deprel_loss: 0.4002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5484, loss: 0.4877, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  68%|######7   | 75/111 [00:52<00:27,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9364, UAS: 0.9645, LAS: 0.9325, UEM: 0.6847, LEM: 0.4736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2349, partial_loss/deprel_loss: 0.3626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4950, loss: 0.4920, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  71%|#######1  | 79/111 [00:55<00:23,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9640, LAS: 0.9320, UEM: 0.6775, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7113, partial_loss/deprel_loss: 0.4739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6793, loss: 0.4946, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  75%|#######4  | 83/111 [00:57<00:19,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9639, LAS: 0.9317, UEM: 0.6702, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4289, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6084, loss: 0.4979, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  78%|#######8  | 87/111 [01:00<00:16,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9635, LAS: 0.9313, UEM: 0.6640, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5999, partial_loss/deprel_loss: 0.4465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6351, loss: 0.5010, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  81%|########1 | 90/111 [01:02<00:14,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9631, LAS: 0.9310, UEM: 0.6608, LEM: 0.4497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6336, partial_loss/deprel_loss: 0.5125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6946, loss: 0.5039, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  85%|########4 | 94/111 [01:04<00:11,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9634, LAS: 0.9313, UEM: 0.6633, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4677, partial_loss/deprel_loss: 0.3887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5624, loss: 0.5020, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  88%|########8 | 98/111 [01:07<00:08,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9631, LAS: 0.9310, UEM: 0.6651, LEM: 0.4536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1180, partial_loss/deprel_loss: 0.2272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3632, loss: 0.5052, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  92%|#########1| 102/111 [01:09<00:05,  1.59it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9632, LAS: 0.9310, UEM: 0.6633, LEM: 0.4508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.3010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4385, loss: 0.5050, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  96%|#########6| 107/111 [01:11<00:02,  1.74it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9630, LAS: 0.9308, UEM: 0.6586, LEM: 0.4462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2975, partial_loss/deprel_loss: 0.2869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4469, loss: 0.5058, batch_reg_loss: 0.1578, reg_loss: 0.1580 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
+      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.287  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.297  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.158  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - UEM                      |     0.659  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - loss                     |     0.506  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - LEM                      |     0.446  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - EM                       |     0.939  |       N/A\n",
+      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:53:46,012 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:53:50,768 - INFO - combo.training.trainer - Epoch duration: 0:01:21.642784\n",
+      "2023-04-07 01:53:50,768 - INFO - combo.training.trainer - Estimated training time remaining: 6:05:22\n",
+      "2023-04-07 01:53:50,768 - INFO - allennlp.training.trainer - Epoch 134/399\n",
+      "2023-04-07 01:53:50,768 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:53:50,769 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:53:50,776 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9718, LAS: 0.9412, UEM: 0.7633, LEM: 0.5488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3156, partial_loss/deprel_loss: 0.3260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4818, loss: 0.4079, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:   3%|2         | 3/111 [00:02<01:31,  1.18it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9762, LAS: 0.9468, UEM: 0.8419, LEM: 0.6702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2195, partial_loss/deprel_loss: 0.2797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4255, loss: 0.3891, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:   5%|5         | 6/111 [00:05<01:29,  1.17it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9733, LAS: 0.9431, UEM: 0.8027, LEM: 0.6205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5134, partial_loss/deprel_loss: 0.4853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6488, loss: 0.4243, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:   8%|8         | 9/111 [00:07<01:24,  1.21it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9699, LAS: 0.9392, UEM: 0.7601, LEM: 0.5743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2198, partial_loss/deprel_loss: 0.2679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4161, loss: 0.4574, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  11%|#         | 12/111 [00:09<01:19,  1.25it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9578, UAS: 0.9700, LAS: 0.9394, UEM: 0.7412, LEM: 0.5441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1170, partial_loss/deprel_loss: 0.2407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3738, loss: 0.4592, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  14%|#4        | 16/111 [00:12<01:13,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9695, LAS: 0.9389, UEM: 0.7309, LEM: 0.5301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4520, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5364, loss: 0.4606, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  17%|#7        | 19/111 [00:14<01:09,  1.32it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9663, LAS: 0.9359, UEM: 0.7046, LEM: 0.5065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7200, partial_loss/deprel_loss: 0.4309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6465, loss: 0.4794, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  20%|#9        | 22/111 [00:16<01:06,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9653, LAS: 0.9347, UEM: 0.6950, LEM: 0.4916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2095, partial_loss/deprel_loss: 0.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4425, loss: 0.4847, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  23%|##3       | 26/111 [00:19<00:59,  1.43it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9653, LAS: 0.9347, UEM: 0.6830, LEM: 0.4757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4296, partial_loss/deprel_loss: 0.4066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5690, loss: 0.4861, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  26%|##6       | 29/111 [00:21<00:57,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9645, LAS: 0.9338, UEM: 0.6744, LEM: 0.4669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8113, partial_loss/deprel_loss: 0.4967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7174, loss: 0.4907, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  29%|##8       | 32/111 [00:23<00:54,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9649, LAS: 0.9343, UEM: 0.6683, LEM: 0.4565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1948, partial_loss/deprel_loss: 0.3047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4405, loss: 0.4874, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  32%|###2      | 36/111 [00:25<00:50,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9644, LAS: 0.9336, UEM: 0.6664, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3603, partial_loss/deprel_loss: 0.3563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.4898, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  35%|###5      | 39/111 [00:27<00:49,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9648, LAS: 0.9339, UEM: 0.6610, LEM: 0.4440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3040, partial_loss/deprel_loss: 0.2915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4517, loss: 0.4882, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  39%|###8      | 43/111 [00:30<00:44,  1.54it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9658, LAS: 0.9349, UEM: 0.6893, LEM: 0.4781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0704, partial_loss/deprel_loss: 0.1725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3098, loss: 0.4800, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  42%|####2     | 47/111 [00:33<00:43,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9647, LAS: 0.9337, UEM: 0.6763, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6020, partial_loss/deprel_loss: 0.4514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6392, loss: 0.4875, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  45%|####5     | 50/111 [00:35<00:42,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9651, LAS: 0.9342, UEM: 0.6885, LEM: 0.4830, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3910, partial_loss/deprel_loss: 0.3737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5349, loss: 0.4831, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  48%|####7     | 53/111 [00:37<00:41,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9645, LAS: 0.9335, UEM: 0.6874, LEM: 0.4803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8582, partial_loss/deprel_loss: 0.5299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7533, loss: 0.4878, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  50%|#####     | 56/111 [00:39<00:39,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9646, LAS: 0.9337, UEM: 0.6868, LEM: 0.4777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2436, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4541, loss: 0.4881, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  53%|#####3    | 59/111 [00:41<00:36,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9632, LAS: 0.9320, UEM: 0.6767, LEM: 0.4680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3082, partial_loss/deprel_loss: 0.5926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8934, loss: 0.4992, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  57%|#####6    | 63/111 [00:44<00:32,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9628, LAS: 0.9318, UEM: 0.6657, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4753, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5409, loss: 0.5014, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  60%|######    | 67/111 [00:46<00:29,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9629, LAS: 0.9317, UEM: 0.6634, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1659, partial_loss/deprel_loss: 0.2795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4145, loss: 0.5002, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  64%|######3   | 71/111 [00:50<00:29,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9411, UAS: 0.9631, LAS: 0.9319, UEM: 0.6611, LEM: 0.4487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2327, partial_loss/deprel_loss: 0.2979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4425, loss: 0.4989, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  68%|######7   | 75/111 [00:52<00:24,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9624, LAS: 0.9312, UEM: 0.6529, LEM: 0.4410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6647, partial_loss/deprel_loss: 0.3638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5816, loss: 0.5027, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  71%|#######1  | 79/111 [00:55<00:21,  1.46it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9530, UAS: 0.9625, LAS: 0.9314, UEM: 0.6539, LEM: 0.4423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1623, partial_loss/deprel_loss: 0.2136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3610, loss: 0.5015, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  74%|#######3  | 82/111 [00:57<00:20,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9600, UAS: 0.9631, LAS: 0.9319, UEM: 0.6668, LEM: 0.4563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0680, partial_loss/deprel_loss: 0.1759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3119, loss: 0.4982, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  77%|#######7  | 86/111 [01:00<00:17,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9634, LAS: 0.9321, UEM: 0.6686, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.3149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4434, loss: 0.4973, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  81%|########1 | 90/111 [01:02<00:13,  1.56it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9634, LAS: 0.9322, UEM: 0.6708, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1608, partial_loss/deprel_loss: 0.2269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3713, loss: 0.4965, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  86%|########5 | 95/111 [01:04<00:09,  1.67it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9634, LAS: 0.9321, UEM: 0.6702, LEM: 0.4563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3192, partial_loss/deprel_loss: 0.3119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4710, loss: 0.4978, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  90%|######### | 100/111 [01:07<00:06,  1.81it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9633, LAS: 0.9318, UEM: 0.6683, LEM: 0.4531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3566, partial_loss/deprel_loss: 0.3839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5360, loss: 0.5001, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  94%|#########3| 104/111 [01:09<00:04,  1.72it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9633, LAS: 0.9319, UEM: 0.6666, LEM: 0.4517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2006, partial_loss/deprel_loss: 0.2815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4229, loss: 0.4998, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  97%|#########7| 108/111 [01:12<00:01,  1.69it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9632, LAS: 0.9319, UEM: 0.6637, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2409, partial_loss/deprel_loss: 0.2592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4131, loss: 0.4991, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
+      "2023-04-07 01:55:07,230 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.259  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.241  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.158  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - UEM                      |     0.664  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - LAS                      |     0.932  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - loss                     |     0.499  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - LEM                      |     0.449  |       N/A\n",
+      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
+      "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
+      "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
+      "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - EM                       |     0.943  |       N/A\n",
+      "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:55:07,236 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:55:11,923 - INFO - combo.training.trainer - Epoch duration: 0:01:21.154867\n",
+      "2023-04-07 01:55:11,924 - INFO - combo.training.trainer - Estimated training time remaining: 6:03:57\n",
+      "2023-04-07 01:55:11,924 - INFO - allennlp.training.trainer - Epoch 135/399\n",
+      "2023-04-07 01:55:11,924 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:55:11,925 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:55:11,933 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9691, LAS: 0.9380, UEM: 0.5843, LEM: 0.3390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2373, partial_loss/deprel_loss: 0.3147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4568, loss: 0.4858, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||:   4%|3         | 4/111 [00:02<01:06,  1.62it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9676, LAS: 0.9361, UEM: 0.6419, LEM: 0.3989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4023, partial_loss/deprel_loss: 0.3518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5195, loss: 0.4727, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||:   6%|6         | 7/111 [00:04<01:09,  1.49it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9674, LAS: 0.9363, UEM: 0.6454, LEM: 0.4098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4563, partial_loss/deprel_loss: 0.3694, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5443, loss: 0.4696, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||:   9%|9         | 10/111 [00:07<01:10,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9644, LAS: 0.9332, UEM: 0.6007, LEM: 0.3720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6226, partial_loss/deprel_loss: 0.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6631, loss: 0.4970, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||:  13%|#2        | 14/111 [00:09<01:04,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9651, LAS: 0.9338, UEM: 0.6030, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4544, partial_loss/deprel_loss: 0.4473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6063, loss: 0.4959, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  15%|#5        | 17/111 [00:11<01:03,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9668, LAS: 0.9357, UEM: 0.6544, LEM: 0.4272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1150, partial_loss/deprel_loss: 0.1990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3397, loss: 0.4817, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  18%|#8        | 20/111 [00:13<01:03,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9659, LAS: 0.9352, UEM: 0.6471, LEM: 0.4242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5934, partial_loss/deprel_loss: 0.4032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5988, loss: 0.4846, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  21%|##        | 23/111 [00:16<01:03,  1.38it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9641, LAS: 0.9333, UEM: 0.6212, LEM: 0.3983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3112, partial_loss/deprel_loss: 0.3003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4600, loss: 0.4957, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  24%|##4       | 27/111 [00:18<00:59,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9648, LAS: 0.9337, UEM: 0.6407, LEM: 0.4168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2263, partial_loss/deprel_loss: 0.3393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4742, loss: 0.4937, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  27%|##7       | 30/111 [00:20<00:56,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9644, LAS: 0.9333, UEM: 0.6349, LEM: 0.4096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3704, partial_loss/deprel_loss: 0.3750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5316, loss: 0.4975, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  30%|##9       | 33/111 [00:23<00:54,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9655, LAS: 0.9345, UEM: 0.6660, LEM: 0.4442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1504, partial_loss/deprel_loss: 0.2351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3756, loss: 0.4871, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  32%|###2      | 36/111 [00:26<01:04,  1.16it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9662, LAS: 0.9350, UEM: 0.6732, LEM: 0.4479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1823, partial_loss/deprel_loss: 0.2917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4273, loss: 0.4840, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  35%|###5      | 39/111 [00:28<00:58,  1.23it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9670, LAS: 0.9356, UEM: 0.6809, LEM: 0.4519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1688, partial_loss/deprel_loss: 0.2671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4049, loss: 0.4804, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  38%|###7      | 42/111 [00:31<00:54,  1.27it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9672, LAS: 0.9359, UEM: 0.6859, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1178, partial_loss/deprel_loss: 0.2272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3628, loss: 0.4778, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  41%|####      | 45/111 [00:33<00:50,  1.30it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9668, LAS: 0.9354, UEM: 0.6857, LEM: 0.4583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2961, partial_loss/deprel_loss: 0.3744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5162, loss: 0.4803, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  43%|####3     | 48/111 [00:35<00:46,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9666, LAS: 0.9353, UEM: 0.6826, LEM: 0.4584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3903, partial_loss/deprel_loss: 0.3601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.4821, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  47%|####6     | 52/111 [00:37<00:42,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9658, LAS: 0.9346, UEM: 0.6777, LEM: 0.4554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7723, partial_loss/deprel_loss: 0.4786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6948, loss: 0.4863, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  50%|####9     | 55/111 [00:39<00:39,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9643, LAS: 0.9332, UEM: 0.6707, LEM: 0.4501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9087, partial_loss/deprel_loss: 0.4306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6837, loss: 0.4946, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  52%|#####2    | 58/111 [00:42<00:38,  1.39it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9643, LAS: 0.9332, UEM: 0.6744, LEM: 0.4534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.2206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3684, loss: 0.4935, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  56%|#####5    | 62/111 [00:44<00:34,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9634, LAS: 0.9321, UEM: 0.6687, LEM: 0.4472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2048, partial_loss/deprel_loss: 0.6180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8928, loss: 0.5009, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  59%|#####8    | 65/111 [00:46<00:32,  1.43it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9634, LAS: 0.9317, UEM: 0.6662, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7750, partial_loss/deprel_loss: 0.5395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7440, loss: 0.5028, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  62%|######2   | 69/111 [00:49<00:27,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9630, LAS: 0.9314, UEM: 0.6552, LEM: 0.4332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.5066, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  67%|######6   | 74/111 [00:51<00:22,  1.64it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9623, LAS: 0.9308, UEM: 0.6477, LEM: 0.4274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1806, partial_loss/deprel_loss: 0.2618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4030, loss: 0.5100, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  70%|#######   | 78/111 [00:54<00:20,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9625, LAS: 0.9310, UEM: 0.6503, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2958, partial_loss/deprel_loss: 0.3772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5183, loss: 0.5094, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  74%|#######3  | 82/111 [00:56<00:18,  1.60it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9623, LAS: 0.9308, UEM: 0.6431, LEM: 0.4219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3598, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5388, loss: 0.5104, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  77%|#######7  | 86/111 [00:59<00:15,  1.66it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9800, UAS: 0.9630, LAS: 0.9316, UEM: 0.6675, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0234, partial_loss/deprel_loss: 0.0818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2275, loss: 0.5049, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  81%|########1 | 90/111 [01:01<00:13,  1.56it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9625, LAS: 0.9312, UEM: 0.6606, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6511, partial_loss/deprel_loss: 0.4525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6496, loss: 0.5073, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  86%|########5 | 95/111 [01:04<00:09,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9624, LAS: 0.9311, UEM: 0.6529, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3028, partial_loss/deprel_loss: 0.3201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4740, loss: 0.5081, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  90%|######### | 100/111 [01:06<00:06,  1.79it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9629, LAS: 0.9315, UEM: 0.6583, LEM: 0.4480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3456, partial_loss/deprel_loss: 0.4009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5472, loss: 0.5050, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  95%|#########4| 105/111 [01:09<00:03,  1.90it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9260, UAS: 0.9632, LAS: 0.9317, UEM: 0.6619, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4365, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5709, loss: 0.5032, batch_reg_loss: 0.1573, reg_loss: 0.1575 ||:  98%|#########8| 109/111 [01:11<00:01,  1.78it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9632, LAS: 0.9317, UEM: 0.6597, LEM: 0.4482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4608, partial_loss/deprel_loss: 0.3829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5558, loss: 0.5031, batch_reg_loss: 0.1573, reg_loss: 0.1575 ||: 100%|##########| 111/111 [01:13<00:00,  1.52it/s]\n",
+      "2023-04-07 01:56:27,897 - INFO - allennlp.training.trainer - Validating\n",
+      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8755, UAS: 0.9614, LAS: 0.9128, UEM: 0.7969, LEM: 0.5543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0105, partial_loss/deprel_loss: 34.5376, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8322, loss: 19.9957, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.01it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9551, LAS: 0.9059, UEM: 0.7413, LEM: 0.4867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3425, partial_loss/deprel_loss: 44.6023, partial_loss/cycle_loss: 0.0000, batch_loss: 35.9504, loss: 23.2370, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.03it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9458, LAS: 0.8954, UEM: 0.6814, LEM: 0.4354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7257, partial_loss/deprel_loss: 28.0299, partial_loss/cycle_loss: 0.0000, batch_loss: 22.5690, loss: 25.5143, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.00it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9509, LAS: 0.9015, UEM: 0.6917, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4239, partial_loss/deprel_loss: 24.7843, partial_loss/cycle_loss: 0.0000, batch_loss: 19.9122, loss: 23.2583, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.02it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9485, LAS: 0.8984, UEM: 0.6581, LEM: 0.3961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9117, partial_loss/deprel_loss: 29.0845, partial_loss/cycle_loss: 0.0000, batch_loss: 23.4500, loss: 23.9880, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
+      "2023-04-07 01:56:40,528 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
+      "2023-04-07 01:56:40,528 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:56:40,528 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.383  |    29.085\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.461  |     0.912\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.157  |     0.000\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - UEM                      |     0.660  |     0.658\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - LAS                      |     0.932  |     0.898\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - loss                     |     0.503  |    23.988\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - LEM                      |     0.448  |     0.396\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |     0.949\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
+      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - EM                       |     0.921  |     0.884\n",
+      "2023-04-07 01:56:40,530 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
+      "2023-04-07 01:56:40,533 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
+      "2023-04-07 01:56:44,748 - INFO - combo.training.trainer - Epoch duration: 0:01:32.824060\n",
+      "2023-04-07 01:56:44,748 - INFO - combo.training.trainer - Estimated training time remaining: 6:02:55\n",
+      "2023-04-07 01:56:44,749 - INFO - allennlp.training.trainer - Epoch 136/399\n",
+      "2023-04-07 01:56:44,749 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
+      "2023-04-07 01:56:44,750 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
+      "2023-04-07 01:56:44,759 - INFO - allennlp.training.trainer - Training\n",
+      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9701, LAS: 0.9398, UEM: 0.6759, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1820, partial_loss/deprel_loss: 0.2697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4095, loss: 0.4615, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:   4%|3         | 4/111 [00:02<01:11,  1.49it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9697, LAS: 0.9401, UEM: 0.7084, LEM: 0.4874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4933, partial_loss/deprel_loss: 0.3671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5497, loss: 0.4480, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:   7%|7         | 8/111 [00:05<01:07,  1.52it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9687, LAS: 0.9379, UEM: 0.6801, LEM: 0.4486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2307, partial_loss/deprel_loss: 0.3055, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4479, loss: 0.4613, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  10%|9         | 11/111 [00:07<01:06,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9682, LAS: 0.9380, UEM: 0.6869, LEM: 0.4659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1802, partial_loss/deprel_loss: 0.2410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3861, loss: 0.4555, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  14%|#3        | 15/111 [00:09<01:03,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9685, LAS: 0.9379, UEM: 0.6714, LEM: 0.4464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4714, loss: 0.4577, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  17%|#7        | 19/111 [00:12<01:01,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9658, LAS: 0.9350, UEM: 0.6613, LEM: 0.4399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9620, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7618, loss: 0.4760, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  21%|##        | 23/111 [00:15<00:58,  1.51it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9653, LAS: 0.9344, UEM: 0.6476, LEM: 0.4248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5369, partial_loss/deprel_loss: 0.3851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5727, loss: 0.4804, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  23%|##3       | 26/111 [00:17<00:57,  1.48it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9657, LAS: 0.9349, UEM: 0.6618, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4090, partial_loss/deprel_loss: 0.3663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5321, loss: 0.4762, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  26%|##6       | 29/111 [00:19<00:57,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9647, LAS: 0.9336, UEM: 0.6680, LEM: 0.4505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0720, partial_loss/deprel_loss: 0.2051, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3357, loss: 0.4839, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  29%|##8       | 32/111 [00:21<00:57,  1.37it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9650, LAS: 0.9338, UEM: 0.6674, LEM: 0.4472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1642, partial_loss/deprel_loss: 0.2539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3932, loss: 0.4823, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  32%|###2      | 36/111 [00:24<00:54,  1.38it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9646, LAS: 0.9335, UEM: 0.6565, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4016, partial_loss/deprel_loss: 0.3892, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5489, loss: 0.4877, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  35%|###5      | 39/111 [00:26<00:51,  1.40it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9645, LAS: 0.9335, UEM: 0.6487, LEM: 0.4291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4346, partial_loss/deprel_loss: 0.3860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5530, loss: 0.4894, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  38%|###7      | 42/111 [00:28<00:48,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9616, UAS: 0.9646, LAS: 0.9337, UEM: 0.6573, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0802, partial_loss/deprel_loss: 0.1775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3153, loss: 0.4892, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  41%|####1     | 46/111 [00:31<00:45,  1.41it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9332, UAS: 0.9645, LAS: 0.9333, UEM: 0.6492, LEM: 0.4313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2660, partial_loss/deprel_loss: 0.3857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5190, loss: 0.4911, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  45%|####5     | 50/111 [00:34<00:41,  1.47it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9644, LAS: 0.9332, UEM: 0.6480, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6622, partial_loss/deprel_loss: 0.4969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6872, loss: 0.4916, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  49%|####8     | 54/111 [00:36<00:37,  1.50it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9653, LAS: 0.9342, UEM: 0.6665, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.3296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4663, loss: 0.4853, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  52%|#####2    | 58/111 [00:38<00:33,  1.58it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9645, LAS: 0.9335, UEM: 0.6710, LEM: 0.4583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5423, partial_loss/deprel_loss: 0.4684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6404, loss: 0.4904, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  56%|#####5    | 62/111 [00:41<00:29,  1.68it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9643, LAS: 0.9335, UEM: 0.6663, LEM: 0.4535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3827, partial_loss/deprel_loss: 0.3363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5027, loss: 0.4911, batch_reg_loss: 0.1572, reg_loss: 0.1572 ||:  60%|######    | 67/111 [00:43<00:24,  1.83it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9639, LAS: 0.9331, UEM: 0.6543, LEM: 0.4413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3624, partial_loss/deprel_loss: 0.3598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5175, loss: 0.4936, batch_reg_loss: 0.1572, reg_loss: 0.1572 ||:  65%|######4   | 72/111 [00:45<00:20,  1.93it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9639, LAS: 0.9333, UEM: 0.6653, LEM: 0.4611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4176, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5278, loss: 0.4929, batch_reg_loss: 0.1572, reg_loss: 0.1572 ||:  68%|######8   | 76/111 [00:48<00:20,  1.75it/s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9643, LAS: 0.9336, UEM: 0.6732, LEM: 0.4684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1612, partial_loss/deprel_loss: 0.2706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4059, loss: 0.4902, batch_reg_loss: 0.1572, reg_loss: 0.1572 ||:  72%|#######2  | 80/111 [00:51<00:19,  1.55it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9637, LAS: 0.9332, UEM: 0.6708, LEM: 0.4675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2048, partial_loss/deprel_loss: 0.2418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3916, loss: 0.4919, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  76%|#######5  | 84/111 [00:54<00:18,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9633, LAS: 0.9327, UEM: 0.6642, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7137, partial_loss/deprel_loss: 0.5212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7168, loss: 0.4959, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  79%|#######9  | 88/111 [00:57<00:16,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9628, LAS: 0.9321, UEM: 0.6605, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5023, partial_loss/deprel_loss: 0.4027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.4999, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  82%|########1 | 91/111 [01:00<00:14,  1.35it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9626, LAS: 0.9319, UEM: 0.6593, LEM: 0.4546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1783, partial_loss/deprel_loss: 0.2851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4208, loss: 0.5013, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  85%|########4 | 94/111 [01:02<00:12,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9628, LAS: 0.9321, UEM: 0.6646, LEM: 0.4604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1742, partial_loss/deprel_loss: 0.2021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3536, loss: 0.4988, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  87%|########7 | 97/111 [01:04<00:10,  1.29it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9628, LAS: 0.9321, UEM: 0.6630, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4777, partial_loss/deprel_loss: 0.3639, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5438, loss: 0.4990, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  90%|######### | 100/111 [01:06<00:08,  1.34it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9631, LAS: 0.9322, UEM: 0.6644, LEM: 0.4581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3459, partial_loss/deprel_loss: 0.3799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5302, loss: 0.4976, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  94%|#########3| 104/111 [01:09<00:04,  1.45it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9630, LAS: 0.9320, UEM: 0.6604, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3434, partial_loss/deprel_loss: 0.3645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5174, loss: 0.4983, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  96%|#########6| 107/111 [01:11<00:02,  1.44it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9631, LAS: 0.9321, UEM: 0.6599, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2039, partial_loss/deprel_loss: 0.2603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4061, loss: 0.4970, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 100%|##########| 111/111 [01:14<00:00,  1.42it/s]\n",
+      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9631, LAS: 0.9321, UEM: 0.6599, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2039, partial_loss/deprel_loss: 0.2603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4061, loss: 0.4970, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
+      "2023-04-07 01:58:01,554 - INFO - combo.training.trainer - Ran out of patience.  Stopping training.\n",
+      "2023-04-07 01:58:01,554 - INFO - allennlp.training.checkpointer - loading best weights\n",
+      "2023-04-07 01:58:02,804 - INFO - allennlp.common.util - Metrics: {\n",
+      "  \"best_epoch\": 135,\n",
+      "  \"peak_worker_0_memory_MB\": 7070.32421875,\n",
+      "  \"peak_gpu_0_memory_MB\": 2425.27294921875,\n",
+      "  \"training_duration\": \"3:06:53.221860\",\n",
+      "  \"training_start_epoch\": 0,\n",
+      "  \"training_epochs\": 135,\n",
+      "  \"epoch\": 135,\n",
+      "  \"training_UPOS_ACC\": 0.0,\n",
+      "  \"training_XPOS_ACC\": 0.0,\n",
+      "  \"training_SEMREL_ACC\": 0.0,\n",
+      "  \"training_LEMMA_ACC\": 0.0,\n",
+      "  \"training_FEATS_ACC\": 0.0,\n",
+      "  \"training_EM\": 0.9211469292640686,\n",
+      "  \"training_UAS\": 0.9631774675364263,\n",
+      "  \"training_LAS\": 0.9317305657860291,\n",
+      "  \"training_UEM\": 0.6596950631978689,\n",
+      "  \"training_LEM\": 0.4481664116080032,\n",
+      "  \"training_EUAS\": 0.0,\n",
+      "  \"training_ELAS\": 0.0,\n",
+      "  \"training_EUEM\": 0.0,\n",
+      "  \"training_ELEM\": 0.0,\n",
+      "  \"training_partial_loss/head_loss\": 0.4608195722103119,\n",
+      "  \"training_partial_loss/deprel_loss\": 0.3828725218772888,\n",
+      "  \"training_partial_loss/cycle_loss\": 0.0,\n",
+      "  \"training_loss\": 0.5030799737653217,\n",
+      "  \"training_reg_loss\": 0.15746027405734533,\n",
+      "  \"training_worker_0_memory_MB\": 7070.32421875,\n",
+      "  \"training_gpu_0_memory_MB\": 2425.27294921875,\n",
+      "  \"training_patience\": 1,\n",
+      "  \"validation_UPOS_ACC\": 0.0,\n",
+      "  \"validation_XPOS_ACC\": 0.0,\n",
+      "  \"validation_SEMREL_ACC\": 0.0,\n",
+      "  \"validation_LEMMA_ACC\": 0.0,\n",
+      "  \"validation_FEATS_ACC\": 0.0,\n",
+      "  \"validation_EM\": 0.8841390609741211,\n",
+      "  \"validation_UAS\": 0.948533243417221,\n",
+      "  \"validation_LAS\": 0.898415228519756,\n",
+      "  \"validation_UEM\": 0.6580882352941176,\n",
+      "  \"validation_LEM\": 0.3961397058823529,\n",
+      "  \"validation_EUAS\": 0.0,\n",
+      "  \"validation_ELAS\": 0.0,\n",
+      "  \"validation_EUEM\": 0.0,\n",
+      "  \"validation_ELEM\": 0.0,\n",
+      "  \"validation_partial_loss/head_loss\": 0.91168212890625,\n",
+      "  \"validation_partial_loss/deprel_loss\": 29.084543228149414,\n",
+      "  \"validation_partial_loss/cycle_loss\": 0.0,\n",
+      "  \"validation_loss\": 23.987967637869026,\n",
+      "  \"validation_reg_loss\": 0.0,\n",
+      "  \"best_validation_UPOS_ACC\": 0.0,\n",
+      "  \"best_validation_XPOS_ACC\": 0.0,\n",
+      "  \"best_validation_SEMREL_ACC\": 0.0,\n",
+      "  \"best_validation_LEMMA_ACC\": 0.0,\n",
+      "  \"best_validation_FEATS_ACC\": 0.0,\n",
+      "  \"best_validation_EM\": 0.8841390609741211,\n",
+      "  \"best_validation_UAS\": 0.948533243417221,\n",
+      "  \"best_validation_LAS\": 0.898415228519756,\n",
+      "  \"best_validation_UEM\": 0.6580882352941176,\n",
+      "  \"best_validation_LEM\": 0.3961397058823529,\n",
+      "  \"best_validation_EUAS\": 0.0,\n",
+      "  \"best_validation_ELAS\": 0.0,\n",
+      "  \"best_validation_EUEM\": 0.0,\n",
+      "  \"best_validation_ELEM\": 0.0,\n",
+      "  \"best_validation_partial_loss/head_loss\": 0.91168212890625,\n",
+      "  \"best_validation_partial_loss/deprel_loss\": 29.084543228149414,\n",
+      "  \"best_validation_partial_loss/cycle_loss\": 0.0,\n",
+      "  \"best_validation_loss\": 23.987967637869026,\n",
+      "  \"best_validation_reg_loss\": 0.0\n",
+      "}\n",
+      "2023-04-07 01:58:02,805 - INFO - allennlp.models.archival - archiving weights and vocabulary to ./allennlpru3hb8qq/model.tar.gz\n",
+      "2023-04-07 02:10:56,965 - INFO - combo.main - Training model stored in: ./allennlpru3hb8qq\n"
+     ]
+    }
+   ],
+   "source": [
+    "! {COMBO} --mode train \\\n",
+    "    --training_data_path connlu/pdbc-train.conllu \\\n",
+    "    --validation_data_path connlu/pdbc-validation.conllu \\\n",
+    "    --cuda_device 0 \\\n",
+    "    --pretrained_transformer_name allegro/herbert-large-cased \\\n",
+    "    --targets head,deprel \\\n",
+    "    --serialization_dir ."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "e2c0090a",
+   "metadata": {},
+   "source": [
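+    "Replace `allennlpru3hb8qq/` in the cell below with the serialization directory that COMBO created for this run (its name is printed in the final `Training model stored in: ...` log line above)."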
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "f630757b",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "! rm -r model-pdbc/\n",
+    "! mv allennlpru3hb8qq/ model-pdbc/"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "combo_python39",
+   "language": "python",
+   "name": "combo_python39"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.16"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git b/TrainingAndEval.ipynb a/TrainingAndEval.ipynb
new file mode 100644
index 0000000..753718e
--- /dev/null
+++ a/TrainingAndEval.ipynb
@@ -0,0 +1,1546 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "97d0c9ab",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "2023-04-11 11:17:29.095631: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations:  AVX2 FMA\n",
+      "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
+      "2023-04-11 11:17:29.331444: E tensorflow/stream_executor/cuda/cuda_blas.cc:2981] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered\n",
+      "2023-04-11 11:17:30.167497: W tensorflow/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory\n",
+      "2023-04-11 11:17:30.167593: W tensorflow/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory\n",
+      "2023-04-11 11:17:30.167603: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly.\n"
+     ]
+    }
+   ],
+   "source": [
+    "import importlib\n",
+    "\n",
+    "from collections import Counter\n",
+    "\n",
+    "import tensorflow as tf\n",
+    "\n",
+    "from datasets import load_dataset\n",
+    "from IPython.display import display, HTML, IFrame"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "7464a6fa",
+   "metadata": {},
+   "source": [
+    "**The cell below forces CPU-only execution when uncommented. Keep it commented out to use the GPU!**"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "c41d6630",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "#import os\n",
+    "#os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"-1\""
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "f30d7b7c",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "1 Physical GPUs, 1 Logical GPUs\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "2023-04-11 11:17:31.717262: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:31.762533: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:31.763529: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:31.765670: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations:  AVX2 FMA\n",
+      "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
+      "2023-04-11 11:17:31.769196: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:31.770058: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:31.770816: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:32.722287: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:32.723281: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:32.724062: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:32.724846: I tensorflow/core/common_runtime/gpu/gpu_device.cc:1616] Created device /job:localhost/replica:0/task:0/device:GPU:0 with 20480 MB memory:  -> device: 0, name: NVIDIA A100 80GB PCIe, pci bus id: 0000:00:05.0, compute capability: 8.0\n"
+     ]
+    }
+   ],
+   "source": [
+    "# https://www.tensorflow.org/guide/gpu\n",
+    "gpus = tf.config.list_physical_devices('GPU')\n",
+    "if gpus:\n",
+    "    try:\n",
+    "        tf.config.set_logical_device_configuration(\n",
+    "            gpus[0],\n",
+    "            [tf.config.LogicalDeviceConfiguration(memory_limit=20*1024)]\n",
+    "        )\n",
+    "        logical_gpus = tf.config.list_logical_devices('GPU')\n",
+    "        print(len(gpus), \"Physical GPUs,\", len(logical_gpus), \"Logical GPUs\")\n",
+    "    except RuntimeError as e:\n",
+    "        print(e)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "89afdb1e",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "/device:GPU:0\n",
+      "2.10.0\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "2023-04-11 11:17:32.739308: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:32.740224: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:32.740975: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:32.741809: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:32.742586: I tensorflow/stream_executor/cuda/cuda_gpu_executor.cc:980] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero\n",
+      "2023-04-11 11:17:32.743322: I tensorflow/core/common_runtime/gpu/gpu_device.cc:1616] Created device /device:GPU:0 with 20480 MB memory:  -> device: 0, name: NVIDIA A100 80GB PCIe, pci bus id: 0000:00:05.0, compute capability: 8.0\n"
+     ]
+    }
+   ],
+   "source": [
+    "print(tf.test.gpu_device_name())\n",
+    "print(tf.__version__)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "2b0ab576",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Found cached dataset pdb_c_beta (/home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1)\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "55f181333dc44c7a811c515cc55c4988",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  0%|          | 0/3 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "pdbc_dataset = load_dataset('pdb_c_beta')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "2f4c317a",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-ff2490f308f7f25b.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-cbb40b0e978ab6ee.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-3facbd810991cd6c.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-e54a8628e59de21f.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-9692de6b8224e758.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-4042ffa1dc5d9323.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-fb250709424f85ec.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-1f6ce0a488a89d56.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-2ae4daf5101c7aa2.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-a1686820d15bcf04.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-fe2c12481861f4bd.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-da5a875c385c3570.arrow\n"
+     ]
+    }
+   ],
+   "source": [
+    "import importlib\n",
+    "\n",
+    "from neural_parser import hybrid_tree_utils\n",
+    "importlib.reload(hybrid_tree_utils)\n",
+    "from neural_parser import dataset_utils\n",
+    "importlib.reload(dataset_utils)\n",
+    "\n",
+    "pdbc_dataset_spines = dataset_utils.add_spines_and_attachments(pdbc_dataset)\n",
+    "pdbc_dataset_spines_compressed = dataset_utils.add_spines_and_attachments(pdbc_dataset, compress=True)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "de1966ed",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-1dfcf507d62f6da8.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-264c0111246b25c1.arrow\n",
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-6a40675124a412f0.arrow\n"
+     ]
+    }
+   ],
+   "source": [
+    "features = pdbc_dataset_spines['train'].features\n",
+    "pdbc_dataset_spines_cont = pdbc_dataset_spines.filter(\n",
+    "    lambda instance: hybrid_tree_utils.tree_from_dataset_instance(instance, features).is_continuous()\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "33ff295b",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "DatasetDict({\n",
+       "    train: Dataset({\n",
+       "        features: ['corp_id', 'sent_id', 'tokens', 'lemmas', 'cposes', 'poses', 'tags', 'heads', 'deprels', 'nonterminals', 'spines', 'anchors', 'anchor_hs'],\n",
+       "        num_rows: 15903\n",
+       "    })\n",
+       "    validation: Dataset({\n",
+       "        features: ['corp_id', 'sent_id', 'tokens', 'lemmas', 'cposes', 'poses', 'tags', 'heads', 'deprels', 'nonterminals', 'spines', 'anchors', 'anchor_hs'],\n",
+       "        num_rows: 1980\n",
+       "    })\n",
+       "    test: Dataset({\n",
+       "        features: ['corp_id', 'sent_id', 'tokens', 'lemmas', 'cposes', 'poses', 'tags', 'heads', 'deprels', 'nonterminals', 'spines', 'anchors', 'anchor_hs'],\n",
+       "        num_rows: 1990\n",
+       "    })\n",
+       "})"
+      ]
+     },
+     "execution_count": 8,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "pdbc_dataset_spines_cont"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "a8ddbc1f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "MODEL = 'allegro/herbert-large-cased'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "8029594b",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "class ClassificationTask(object):\n",
+    "    \n",
+    "    def __init__(\n",
+    "            self,\n",
+    "            name,\n",
+    "            dataset,\n",
+    "        ):\n",
+    "        self.name = name\n",
+    "        self.dataset = dataset"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 36,
+   "id": "be8e93fa",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def crop(dataset, n):\n",
+    "    return dataset.filter(lambda example: len(example['tokens']) <= n)\n",
+    "\n",
+    "spines_pdbc = ClassificationTask(\n",
+    "    'spines_pdbc',\n",
+    "    pdbc_dataset_spines,\n",
+    "    #crop(pdbc_dataset, 6),\n",
+    ")\n",
+    "\n",
+    "spines_pdbc_cont = ClassificationTask(\n",
+    "    'spines_pdbc_cont',\n",
+    "    pdbc_dataset_spines_cont,\n",
+    "    #crop(pdbc_dataset, 6),\n",
+    ")\n",
+    "\n",
+    "spines_pdbc_compressed = ClassificationTask(\n",
+    "    'spines_pdbc_compressed',\n",
+    "    pdbc_dataset_spines_compressed,\n",
+    "    #crop(pdbc_dataset, 6),\n",
+    ")\n",
+    "\n",
+    "TASK = spines_pdbc_compressed\n",
+    "TRAIN = False"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 37,
+   "id": "7824fcee",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from neural_parser import training"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 38,
+   "id": "1eb5f41a",
+   "metadata": {
+    "scrolled": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Loading BERT tokenizer...\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-49fe5b05228c3588.arrow\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Preprocessing the dataset for BERT...\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "5f108b00fcab4db8a610f24ae03b7308",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  0%|          | 0/2211 [00:00<?, ?ex/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Loading cached processed dataset at /home/kkrasnowska/.cache/huggingface/datasets/pdb_c_beta/pdb_c_beta/0.2.0/d9c6dc764ae2a3483fa112c6159db4a0342dba8083bdb3b5981c45435b0692e1/cache-b8e2900fbd9615fd.arrow\n",
+      "You're using a HerbertTokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.\n"
+     ]
+    }
+   ],
+   "source": [
+    "trainer = training.Trainer(\n",
+    "    MODEL,\n",
+    "    dataset=TASK.dataset,\n",
+    "    batch_size=16,\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "ac012dc7",
+   "metadata": {},
+   "source": [
+    "### Training with TensorBoard logging"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 39,
+   "id": "276708cc",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "('keras_fit_logs_spines_pdbc_compressed', 'models_spines_pdbc_compressed')"
+      ]
+     },
+     "execution_count": 39,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "log_dir = f'keras_fit_logs_{TASK.name}'\n",
+    "model_dir = f'models_{TASK.name}'\n",
+    "\n",
+    "log_dir, model_dir"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 40,
+   "id": "e8ccde06",
+   "metadata": {
+    "scrolled": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "The tensorboard extension is already loaded. To reload it, use:\n",
+      "  %reload_ext tensorboard\n",
+      "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\n",
+      "To disable this warning, you can either:\n",
+      "\t- Avoid using `tokenizers` before the fork if possible\n",
+      "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "\n",
+       "      <iframe id=\"tensorboard-frame-83a6a03964d4187a\" width=\"100%\" height=\"800\" frameborder=\"0\">\n",
+       "      </iframe>\n",
+       "      <script>\n",
+       "        (function() {\n",
+       "          const frame = document.getElementById(\"tensorboard-frame-83a6a03964d4187a\");\n",
+       "          const url = new URL(\"/\", window.location);\n",
+       "          const port = 6004;\n",
+       "          if (port) {\n",
+       "            url.port = port;\n",
+       "          }\n",
+       "          frame.src = url;\n",
+       "        })();\n",
+       "      </script>\n",
+       "    "
+      ],
+      "text/plain": [
+       "<IPython.core.display.HTML object>"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "%load_ext tensorboard\n",
+    "! killall tensorboard\n",
+    "%tensorboard --port 6004 \\\n",
+    "    --logdir_spec logs:{log_dir},logs0:{keras_fit_logs_spines_pdbc}"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 41,
+   "id": "a5b0da64",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 6 µs, sys: 1 µs, total: 7 µs\n",
+      "Wall time: 15.7 µs\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "\n",
+    "if TRAIN:\n",
+    "    parser = trainer.train(\n",
+    "        lr=0.00001,\n",
+    "        epochs=50,\n",
+    "        log_dir=log_dir,\n",
+    "        model_dir=model_dir,\n",
+    "    )"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 42,
+   "id": "e42b2bd4",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "#import importlib\n",
+    "#from neural_parser import hybrid_tree_utils\n",
+    "#importlib.reload(hybrid_tree_utils)\n",
+    "#from neural_parser import data_utils\n",
+    "#importlib.reload(data_utils)\n",
+    "#from neural_parser import constituency_parser\n",
+    "#importlib.reload(constituency_parser)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 43,
+   "id": "2f65dead",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "created 3 classifier(s)\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Some layers from the model checkpoint at models_spines_pdbc_compressed/model were not used when initializing TFBertForMultiTargetTokenClassification: ['dropout_73']\n",
+      "- This IS expected if you are initializing TFBertForMultiTargetTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n",
+      "- This IS NOT expected if you are initializing TFBertForMultiTargetTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n",
+      "All the layers of TFBertForMultiTargetTokenClassification were initialized from the model checkpoint at models_spines_pdbc_compressed/model.\n",
+      "If your task is similar to the task the model of the checkpoint was trained on, you can already use TFBertForMultiTargetTokenClassification for predictions without further training.\n"
+     ]
+    }
+   ],
+   "source": [
+    "if not TRAIN:\n",
+    "    from neural_parser import constituency_parser\n",
+    "    parser = constituency_parser.ConstituencyParser.load(model_dir)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 44,
+   "id": "24edee79",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "sentences = [\n",
+    "    'Miał em kotka .',\n",
+    "    'Wlazł kotek na płotek i mruga .',\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 45,
+   "id": "4a7cd10b",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "1/1 [==============================] - 10s 10s/step\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "[(['Miał', 'em', 'kotka', '.'],\n",
+       "  {'spines': ['ROOT_S_VP_V', '<EMPTY>', 'NP_N', 'Punct'],\n",
+       "   'anchors': ['<ROOT>', 'V', 'S', 'ROOT'],\n",
+       "   'anchor_hs': ['<ROOT>', '1', '1', '1']}),\n",
+       " (['Wlazł', 'kotek', 'na', 'płotek', 'i', 'mruga', '.'],\n",
+       "  {'spines': ['VP_V',\n",
+       "    'NP_N',\n",
+       "    'PrepNP_Prep',\n",
+       "    'NP_N',\n",
+       "    'ROOT_S_VP_Conj',\n",
+       "    'VP_V',\n",
+       "    'Punct'],\n",
+       "   'anchors': ['VP', 'S', 'VP', 'PrepNP', '<ROOT>', 'VP', 'ROOT'],\n",
+       "   'anchor_hs': ['1', '1', '2', '1', '<ROOT>', '1', '1']})]"
+      ]
+     },
+     "execution_count": 45,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "parser.parse(sentences)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "b814587d",
+   "metadata": {},
+   "source": [
+    "### Evaluation\n",
+    "\n",
+    "#### Hybrid"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 46,
+   "id": "4ac4b9df",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<module 'neural_parser.constants' from '/home/kkrasnowska/neural-parsing/ICCS/neural_parser/constants.py'>"
+      ]
+     },
+     "execution_count": 46,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from neural_parser import hybrid_tree_utils\n",
+    "importlib.reload(hybrid_tree_utils)\n",
+    "from neural_parser import constants\n",
+    "importlib.reload(constants)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 47,
+   "id": "d1b28792",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from spacy import displacy\n",
+    "\n",
+    "def to_deps(tokens, deprels, heads):\n",
+    "    deps = {'words' : [], 'arcs' : []}\n",
+    "    for i, (token, deprel, head) in enumerate(zip(tokens, deprels, heads)):\n",
+    "        deps['words'].append({'text' : token, 'tag' : 'X'})\n",
+    "        if head >= 0:\n",
+    "            d = 'left' if head > i else 'right'\n",
+    "            start, end = sorted((i, head))\n",
+    "            deps['arcs'].append({'start' : start, 'end' : end, 'label' : deprel, 'dir' : d})\n",
+    "    return deps\n",
+    "\n",
+    "def display_deps(tokens, deprels, heads):\n",
+    "    displacy.render(to_deps(tokens, deprels, heads), manual=True, options={'distance' : 80})\n",
+    "    \n",
+    "import urllib.parse\n",
+    "import json\n",
+    "\n",
+    "def show_tree(tree):\n",
+    "    tree_json = json.dumps(hybrid_tree_utils.tree2dict(tree)['tree'])\n",
+    "    src = f'http://127.0.0.1:8010/?tree={urllib.parse.quote(tree_json)}'\n",
+    "    display(IFrame(src, 950, 550))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 48,
+   "id": "9f443569",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2211\n",
+      "2205\n",
+      "['Całuję', '.']\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{'heads': [None, 0],\n",
+       " 'deprels': ['ROOT', 'punct'],\n",
+       " 'spines': ['ROOT_S_VP_V', 'Punct'],\n",
+       " 'anchors': ['<ROOT>', 'ROOT'],\n",
+       " 'anchor_hs': ['<ROOT>', '1']}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "['Drzemał', '.']\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{'heads': [None, 0],\n",
+       " 'deprels': ['ROOT', 'punct'],\n",
+       " 'spines': ['ROOT_S_VP_V', 'Punct'],\n",
+       " 'anchors': ['<ROOT>', 'ROOT'],\n",
+       " 'anchor_hs': ['<ROOT>', '1']}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "HDR = [\n",
+    "    'heads', 'deprels',\n",
+    "    constants.SPINES, constants.ANCHORS, constants.ANCHOR_HS\n",
+    "]\n",
+    "\n",
+    "values = ['heads']\n",
+    "\n",
+    "def get_gold_data(dataset):\n",
+    "    GOLD = []\n",
+    "    for sent in dataset:\n",
+    "        tokens = sent[constants.TOKENS]\n",
+    "        tags = {\n",
+    "            c : [dataset.features[c].feature.int2str(v) if c not in values else v for v in sent[c]]\n",
+    "            for c in HDR\n",
+    "        }\n",
+    "        GOLD.append([tokens, tags])\n",
+    "    GOLD = sorted(GOLD, key=lambda x: (len(x[0]), ''.join(x[0])))\n",
+    "    print(len(GOLD))\n",
+    "    TOKENS, TAGS = zip(*GOLD)\n",
+    "    return TOKENS, TAGS\n",
+    "\n",
+    "TOKENS_VAL, TAGS_VAL = get_gold_data(TASK.dataset['validation'])\n",
+    "TOKENS_TEST, TAGS_TEST = get_gold_data(TASK.dataset['test'])\n",
+    "\n",
+    "print(TOKENS_VAL[0])\n",
+    "display(TAGS_VAL[0])\n",
+    "print(TOKENS_TEST[0])\n",
+    "display(TAGS_TEST[0])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 49,
+   "id": "3f53c039",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "70/70 [==============================] - 17s 152ms/step\n",
+      "69/69 [==============================] - 12s 168ms/step\n",
+      "['Całuję', '.']\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{'spines': ['ROOT_S_VP_V', 'Punct'],\n",
+       " 'anchors': ['<ROOT>', 'ROOT'],\n",
+       " 'anchor_hs': ['<ROOT>', '1']}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "['Drzemał', '.']\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{'spines': ['ROOT_S_VP_V', 'Punct'],\n",
+       " 'anchors': ['<ROOT>', 'ROOT'],\n",
+       " 'anchor_hs': ['<ROOT>', '1']}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "def get_predicted_data(TOKENS_TRUE):\n",
+    "    PARSED = parser.parse([' '.join(toks) for toks in TOKENS_TRUE])\n",
+    "    TOKENS, TAGS = zip(*PARSED)\n",
+    "    try:\n",
+    "        assert(TOKENS == TOKENS_TRUE)\n",
+    "    except:\n",
+    "        for tp, tt in zip(TOKENS, TOKENS_TRUE):\n",
+    "            if tp != tt:\n",
+    "                print(tp)\n",
+    "                print(tt)\n",
+    "        raise\n",
+    "    return TOKENS, TAGS\n",
+    "\n",
+    "TOKENS_P_VAL, TAGS_P_VAL = get_predicted_data(TOKENS_VAL)\n",
+    "TOKENS_P_TEST, TAGS_P_TEST = get_predicted_data(TOKENS_TEST)\n",
+    "\n",
+    "print(TOKENS_P_VAL[0])\n",
+    "display(TAGS_P_VAL[0])\n",
+    "print(TOKENS_P_TEST[0])\n",
+    "display(TAGS_P_TEST[0])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 50,
+   "id": "17c1d9cb",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2211\n",
+      "2205\n",
+      "['Całuję', '.']\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{'heads': [None, 0], 'deprels': ['root', 'punct']}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "['Drzemał', '.']\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{'heads': [None, 0], 'deprels': ['root', 'punct']}"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "import conllu\n",
+    "\n",
+    "def get_combo_data(path):\n",
+    "    fields = list(conllu.parser.DEFAULT_FIELDS)\n",
+    "    fields[1] = 'token' \n",
+    "    with open(path) as f:\n",
+    "        x = conllu.parse(f.read(), fields=fields)\n",
+    "    COMBO = []\n",
+    "    for sent in x:\n",
+    "        tokens = [tok['token'] for tok in sent]\n",
+    "        heads = [tok['head'] - 1 if tok['head'] != 0 else None for tok in sent]\n",
+    "        deprels = [tok['deprel'] for tok in sent]\n",
+    "        COMBO.append([tokens, {'heads' : heads, 'deprels' : deprels}])\n",
+    "\n",
+    "    COMBO = sorted(COMBO, key=lambda x: (len(x[0]), ''.join(x[0])))\n",
+    "    print(len(COMBO))\n",
+    "    TOKENS, TAGS = zip(*COMBO)\n",
+    "    return TOKENS, TAGS\n",
+    "\n",
+    "TOKENS_C_VAL, TAGS_C_VAL = get_combo_data('COMBO/connlu/pdbc-validation-pred.conllu')\n",
+    "TOKENS_C_TEST, TAGS_C_TEST = get_combo_data('COMBO/connlu/pdbc-test-pred.conllu')\n",
+    "\n",
+    "assert(TOKENS_C_VAL == TOKENS_VAL)\n",
+    "assert(TOKENS_C_TEST == TOKENS_TEST)\n",
+    "\n",
+    "print(TOKENS_C_VAL[0])\n",
+    "display(TAGS_C_VAL[0])\n",
+    "print(TOKENS_C_TEST[0])\n",
+    "display(TAGS_C_TEST[0])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 51,
+   "id": "004918c6",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def _tree2spans(tree, spans, labeled=True, headed=False):\n",
+    "    if headed and not labeled:\n",
+    "        raise RuntimeError('cant’t use headed=True with labeled=False')\n",
+    "    if not tree.children:\n",
+    "        return {tree.from_index}\n",
+    "    span = set()\n",
+    "    for child in tree.children:\n",
+    "        span.update(_tree2spans(child, spans, labeled, headed))\n",
+    "    spans += [(tuple(sorted(span)), tree.category if labeled else 'SPAN', tree.is_head if headed else False)]\n",
+    "    return span\n",
+    "\n",
+    "def tree2spans(tree, labeled=True, headed=False):\n",
+    "    spans = []\n",
+    "    _tree2spans(tree, spans, labeled=labeled, headed=headed)\n",
+    "    # TODO\n",
+    "    #try:\n",
+    "    #    assert(len(spans) == len(set(spans)))\n",
+    "    #except:\n",
+    "    #    show_tree(tree)\n",
+    "    #    (display(spans))\n",
+    "    #    1/0\n",
+    "    return set(spans)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 52,
+   "id": "65d493ca",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<module 'neural_parser.hybrid_tree_utils' from '/home/kkrasnowska/neural-parsing/ICCS/neural_parser/hybrid_tree_utils.py'>"
+      ]
+     },
+     "execution_count": 52,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from sklearn.metrics import precision_score, recall_score, f1_score, accuracy_score\n",
+    "\n",
+    "importlib.reload(hybrid_tree_utils)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 53,
+   "id": "e5f88e76",
+   "metadata": {
+    "scrolled": false
+   },
+   "outputs": [],
+   "source": [
+    "ROOT = 'ROOT'\n",
+    "\n",
+    "def evaluate(tokens, tags_true, tags_pred, tags_combo, labeled=True, headed=False):\n",
+    "\n",
+    "    P, R = [0, 0], [0, 0]\n",
+    "    accuracies = {\n",
+    "        key : {'true' : [], 'pred' : []} for key in ('heads', ('heads', 'deprels'))\n",
+    "    }\n",
+    "\n",
+    "    k = 0\n",
+    "    i = 0\n",
+    "    PROBLEM_TREES = []\n",
+    "\n",
+    "    for toks, true, pred, combo in zip(tokens, tags_true, tags_pred, tags_combo):\n",
+    "        \n",
+    "        #sent = ' '.join(toks)\n",
+    "        #cats = HDR\n",
+    "        #true = dict(zip(cats, zip(*true)))\n",
+    "        #pred = dict(zip(cats, zip(*pred)))\n",
+    "        #print('----------------------------')\n",
+    "        #print(sent)\n",
+    "        dummy = {'lemmas' : ['_' for _ in toks], 'tags' : ['_' for _ in toks]}\n",
+    "        true.update(dummy)\n",
+    "        pred.update(dummy)\n",
+    "        pred.update(combo)\n",
+    "        try:\n",
+    "            tree_true = hybrid_tree_utils.make_tree(toks, true, ROOT, decompress=True)\n",
+    "        except:\n",
+    "            print(toks)\n",
+    "            display(true)\n",
+    "            raise\n",
+    "        try:\n",
+    "            tree_pred = hybrid_tree_utils.make_tree(toks, pred, ROOT, decompress=True)\n",
+    "        except:\n",
+    "            print(toks)\n",
+    "            display(pred)\n",
+    "            print('=============================')\n",
+    "            raise\n",
+    "            tree_pred, problems = None, None\n",
+    "        #if 'reattach' in problems:\n",
+    "        #    show_tree(tree_pred)\n",
+    "        \n",
+    "        #if pred['lemmas_corr'] != pred['lemmas']:\n",
+    "        #    print(pred['lemmas_corr'])\n",
+    "        #    print(pred['lemmas'])\n",
+    "        \n",
+    "        for key, v in accuracies.items():\n",
+    "            if type(key) == str:\n",
+    "                v['pred'] += [-1 if p is None else p for p in pred[key]]\n",
+    "                v['true'] += [-1 if k is None else k for k in true[key]]\n",
+    "            else:\n",
+    "                v['pred'] += ['#'.join(map(str, x)) for x in zip(*(pred[kk] for kk in key))]\n",
+    "                v['true'] += ['#'.join(map(str, x)) for x in zip(*(true[kk] for kk in key))]\n",
+    "        \n",
+    "        spans_true = tree2spans(tree_true, labeled=labeled, headed=headed)\n",
+    "        spans_pred = tree2spans(tree_pred, labeled=labeled, headed=headed) if tree_pred else set()\n",
+    "        if 'adwokata' in toks:\n",
+    "            print(spans_true)\n",
+    "            print(spans_pred)\n",
+    "        tp = len(spans_true.intersection(spans_pred))\n",
+    "        P[0] += tp\n",
+    "        R[0] += tp\n",
+    "        P[1] += len(spans_pred)\n",
+    "        R[1] += len(spans_true)\n",
+    "        leafs = tree_true.get_yield()\n",
+    "        discont = [leaf.from_index for leaf in leafs] != list(range(len(leafs)))\n",
+    "        #if k < 5 and len(toks) > 9 and [leaf.features['index'] for leaf in leafs] != list(range(len(leafs))):\n",
+    "        #if k < 5 and spans_combo != spans_true:\n",
+    "        #if k < 5 and not OK:\n",
+    "        #if discont and len(toks) > 12 and k < 0 and spans_pred == spans_true:\n",
+    "        if len(toks) == 8 and k < 0:\n",
+    "            print('GOLD TREE:')\n",
+    "            show_tree(tree_true)\n",
+    "            display(true)\n",
+    "            #display(_tree2dict(tree_true))\n",
+    "            print('PREDICTED TREE:')\n",
+    "            show_tree(tree_pred)\n",
+    "            display(pred)\n",
+    "            print('FP:', spans_pred - spans_true)\n",
+    "            print('FN:', spans_true - spans_pred)\n",
+    "            k += 1\n",
+    "        i += 1\n",
+    "    \n",
+    "    p, r = P[0]/P[1], R[0]/R[1]\n",
+    "    return {\n",
+    "        'P' : p, 'R': r, 'F1': (2 * p * r) / (p + r),\n",
+    "        'UAS' : accuracy_score(accuracies['heads']['true'], accuracies['heads']['pred']),\n",
+    "        'LAS' : accuracy_score(accuracies[('heads', 'deprels')]['true'], accuracies[('heads', 'deprels')]['pred']),\n",
+    "    }"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "df6a06fb",
+   "metadata": {},
+   "source": [
+    "0.9630140404796617\n",
+    "0.9605916493076027\n",
+    "0.9618013196384767\n",
+    "\n",
+    "– stare liczenie, bez kompresji, z tagami"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 54,
+   "id": "8f8a771a",
+   "metadata": {
+    "scrolled": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "unlabeled{((3,), 'SPAN', False), ((2, 3), 'SPAN', False), ((4,), 'SPAN', False), ((0, 1, 2, 3, 4), 'SPAN', False), ((0, 1, 2, 3), 'SPAN', False), ((2,), 'SPAN', False), ((0, 1), 'SPAN', False)}\n",
+      "{((3,), 'SPAN', False), ((2, 3), 'SPAN', False), ((4,), 'SPAN', False), ((0, 1, 2, 3, 4), 'SPAN', False), ((0, 1, 2, 3), 'SPAN', False), ((2,), 'SPAN', False), ((0, 1), 'SPAN', False)}\n",
+      "non-headed{((2,), 'Prep', False), ((4,), 'Punct', False), ((2, 3), 'PrepNP', False), ((3,), 'N', False), ((0, 1, 2, 3), 'S', False), ((0, 1), 'VP', False), ((0, 1), 'V', False), ((3,), 'NP', False), ((0, 1, 2, 3, 4), 'ROOT', False)}\n",
+      "{((2,), 'Prep', False), ((4,), 'Punct', False), ((2, 3), 'PrepNP', False), ((3,), 'N', False), ((0, 1, 2, 3), 'S', False), ((0, 1), 'VP', False), ((0, 1), 'V', False), ((3,), 'NP', False), ((0, 1, 2, 3, 4), 'ROOT', False)}\n",
+      "headed{((0, 1, 2, 3), 'S', True), ((4,), 'Punct', False), ((0, 1), 'VP', True), ((2, 3), 'PrepNP', False), ((0, 1), 'V', True), ((3,), 'NP', False), ((0, 1, 2, 3, 4), 'ROOT', False), ((2,), 'Prep', True), ((3,), 'N', True)}\n",
+      "{((0, 1, 2, 3), 'S', True), ((4,), 'Punct', False), ((0, 1), 'VP', True), ((2, 3), 'PrepNP', False), ((0, 1), 'V', True), ((3,), 'NP', False), ((0, 1, 2, 3, 4), 'ROOT', False), ((2,), 'Prep', True), ((3,), 'N', True)}\n"
+     ]
+    }
+   ],
+   "source": [
+    "EVAL_DATA = {\n",
+    "    '1val' : (TOKENS_VAL, TAGS_VAL, TAGS_P_VAL, TAGS_C_VAL),\n",
+    "    '2test' : (TOKENS_TEST, TAGS_TEST, TAGS_P_TEST, TAGS_C_TEST),\n",
+    "}\n",
+    "EVAL_MODES = {\n",
+    "    '1unlabeled' : {'labeled' : False, 'headed' : False},\n",
+    "    '2non-headed' : {'labeled' : True, 'headed' : False},\n",
+    "    '3headed' : {'labeled' : True, 'headed' : True},\n",
+    "}\n",
+    "\n",
+    "METRICS = ('P', 'R', 'F1')\n",
+    "\n",
+    "RESULTS = []\n",
+    "\n",
+    "tex = []\n",
+    "tex.append('\\\\toprule\\n')\n",
+    "tex.append('& \\\\multicolumn{3}{c}{validation} & \\\\multicolumn{3}{c}{test} \\\\\\\\\\n')\n",
+    "tex.append('& precision & recall & F1 & precision & recall & F1 \\\\\\\\\\n')\n",
+    "tex.append('\\\\midrule\\n')\n",
+    "for mode_name, mode in sorted(EVAL_MODES.items()):\n",
+    "    print(mode_name[1:], end='')\n",
+    "    tex.append(mode_name)\n",
+    "    for data_name, data in sorted(EVAL_DATA.items()):\n",
+    "        evaluation = evaluate(*data, **mode)\n",
+    "        for metric in METRICS:\n",
+    "            tex.append(f' & {100 * evaluation[metric]:.2f}\\\\%')\n",
+    "            RESULTS.append((data_name, mode_name, metric, evaluation[metric]))\n",
+    "    tex.append(' \\\\\\\\\\n')\n",
+    "tex.append('\\\\bottomrule\\n')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 55,
+   "id": "63192852",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import pandas as pd"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 56,
+   "id": "78250b1b",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "rows = set((r[0][1:], r[1][1:] if r[2] in ('P', 'R', 'F1') else '-', r[2], r[3]) for r in RESULTS)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 57,
+   "id": "bba6ed15",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "results = pd.DataFrame(data=rows, columns=['dataset', 'measure_type', 'measure', 'value'])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 58,
+   "id": "543377f8",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>dataset</th>\n",
+       "      <th>measure_type</th>\n",
+       "      <th>measure</th>\n",
+       "      <th>value</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>dataset</th>\n",
+       "      <th>measure</th>\n",
+       "      <th>measure_type</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"9\" valign=\"top\">test</th>\n",
+       "      <th rowspan=\"3\" valign=\"top\">F1</th>\n",
+       "      <th>headed</th>\n",
+       "      <th>7</th>\n",
+       "      <td>test</td>\n",
+       "      <td>headed</td>\n",
+       "      <td>F1</td>\n",
+       "      <td>0.959192</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>non-headed</th>\n",
+       "      <th>8</th>\n",
+       "      <td>test</td>\n",
+       "      <td>non-headed</td>\n",
+       "      <td>F1</td>\n",
+       "      <td>0.965236</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unlabeled</th>\n",
+       "      <th>15</th>\n",
+       "      <td>test</td>\n",
+       "      <td>unlabeled</td>\n",
+       "      <td>F1</td>\n",
+       "      <td>0.964436</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">P</th>\n",
+       "      <th>headed</th>\n",
+       "      <th>9</th>\n",
+       "      <td>test</td>\n",
+       "      <td>headed</td>\n",
+       "      <td>P</td>\n",
+       "      <td>0.959611</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>non-headed</th>\n",
+       "      <th>6</th>\n",
+       "      <td>test</td>\n",
+       "      <td>non-headed</td>\n",
+       "      <td>P</td>\n",
+       "      <td>0.965658</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unlabeled</th>\n",
+       "      <th>13</th>\n",
+       "      <td>test</td>\n",
+       "      <td>unlabeled</td>\n",
+       "      <td>P</td>\n",
+       "      <td>0.964118</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">R</th>\n",
+       "      <th>headed</th>\n",
+       "      <th>2</th>\n",
+       "      <td>test</td>\n",
+       "      <td>headed</td>\n",
+       "      <td>R</td>\n",
+       "      <td>0.958773</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>non-headed</th>\n",
+       "      <th>5</th>\n",
+       "      <td>test</td>\n",
+       "      <td>non-headed</td>\n",
+       "      <td>R</td>\n",
+       "      <td>0.964815</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unlabeled</th>\n",
+       "      <th>0</th>\n",
+       "      <td>test</td>\n",
+       "      <td>unlabeled</td>\n",
+       "      <td>R</td>\n",
+       "      <td>0.964754</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"9\" valign=\"top\">val</th>\n",
+       "      <th rowspan=\"3\" valign=\"top\">F1</th>\n",
+       "      <th>headed</th>\n",
+       "      <th>14</th>\n",
+       "      <td>val</td>\n",
+       "      <td>headed</td>\n",
+       "      <td>F1</td>\n",
+       "      <td>0.957423</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>non-headed</th>\n",
+       "      <th>4</th>\n",
+       "      <td>val</td>\n",
+       "      <td>non-headed</td>\n",
+       "      <td>F1</td>\n",
+       "      <td>0.963231</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unlabeled</th>\n",
+       "      <th>1</th>\n",
+       "      <td>val</td>\n",
+       "      <td>unlabeled</td>\n",
+       "      <td>F1</td>\n",
+       "      <td>0.962553</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">P</th>\n",
+       "      <th>headed</th>\n",
+       "      <th>10</th>\n",
+       "      <td>val</td>\n",
+       "      <td>headed</td>\n",
+       "      <td>P</td>\n",
+       "      <td>0.958145</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>non-headed</th>\n",
+       "      <th>16</th>\n",
+       "      <td>val</td>\n",
+       "      <td>non-headed</td>\n",
+       "      <td>P</td>\n",
+       "      <td>0.963958</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unlabeled</th>\n",
+       "      <th>11</th>\n",
+       "      <td>val</td>\n",
+       "      <td>unlabeled</td>\n",
+       "      <td>P</td>\n",
+       "      <td>0.962762</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"3\" valign=\"top\">R</th>\n",
+       "      <th>headed</th>\n",
+       "      <th>17</th>\n",
+       "      <td>val</td>\n",
+       "      <td>headed</td>\n",
+       "      <td>R</td>\n",
+       "      <td>0.956702</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>non-headed</th>\n",
+       "      <th>12</th>\n",
+       "      <td>val</td>\n",
+       "      <td>non-headed</td>\n",
+       "      <td>R</td>\n",
+       "      <td>0.962505</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>unlabeled</th>\n",
+       "      <th>3</th>\n",
+       "      <td>val</td>\n",
+       "      <td>unlabeled</td>\n",
+       "      <td>R</td>\n",
+       "      <td>0.962343</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                                dataset measure_type measure     value\n",
+       "dataset measure measure_type                                          \n",
+       "test    F1      headed       7     test       headed      F1  0.959192\n",
+       "                non-headed   8     test   non-headed      F1  0.965236\n",
+       "                unlabeled    15    test    unlabeled      F1  0.964436\n",
+       "        P       headed       9     test       headed       P  0.959611\n",
+       "                non-headed   6     test   non-headed       P  0.965658\n",
+       "                unlabeled    13    test    unlabeled       P  0.964118\n",
+       "        R       headed       2     test       headed       R  0.958773\n",
+       "                non-headed   5     test   non-headed       R  0.964815\n",
+       "                unlabeled    0     test    unlabeled       R  0.964754\n",
+       "val     F1      headed       14     val       headed      F1  0.957423\n",
+       "                non-headed   4      val   non-headed      F1  0.963231\n",
+       "                unlabeled    1      val    unlabeled      F1  0.962553\n",
+       "        P       headed       10     val       headed       P  0.958145\n",
+       "                non-headed   16     val   non-headed       P  0.963958\n",
+       "                unlabeled    11     val    unlabeled       P  0.962762\n",
+       "        R       headed       17     val       headed       R  0.956702\n",
+       "                non-headed   12     val   non-headed       R  0.962505\n",
+       "                unlabeled    3      val    unlabeled       R  0.962343"
+      ]
+     },
+     "execution_count": 58,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "results.groupby(['dataset', 'measure', 'measure_type'], group_keys=True).apply(lambda x: x)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 59,
+   "id": "0b5d3fe4",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\\toprule\n",
+      "& \\multicolumn{3}{c}{validation} & \\multicolumn{3}{c}{test} \\\\\n",
+      "& precision & recall & F1 & precision & recall & F1 \\\\\n",
+      "\\midrule\n",
+      "1unlabeled & 96.28\\% & 96.23\\% & 96.26\\% & 96.41\\% & 96.48\\% & 96.44\\% \\\\\n",
+      "2non-headed & 96.40\\% & 96.25\\% & 96.32\\% & 96.57\\% & 96.48\\% & 96.52\\% \\\\\n",
+      "3headed & 95.81\\% & 95.67\\% & 95.74\\% & 95.96\\% & 95.88\\% & 95.92\\% \\\\\n",
+      "\\bottomrule\n"
+     ]
+    }
+   ],
+   "source": [
+    "for t in tex:\n",
+    "    print(t, end='')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "7946f27c",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "3ff86ee7",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "378cc977",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def evaluate_spines(tags_true, tags_pred):\n",
+    "\n",
+    "    TRUE, PRED = [], []\n",
+    "    values = set()\n",
+    "\n",
+    "    for true, pred in zip(tags_true, tags_pred):\n",
+    "        t, p = true['spines'], pred['spines']\n",
+    "        TRUE += t\n",
+    "        PRED += p\n",
+    "        values.update(t + p)\n",
+    "    \n",
+    "    print('ACCURACY:', accuracy_score(TRUE, PRED))\n",
+    "    \n",
+    "    values = sorted(values)\n",
+    "    ct = Counter(TRUE)\n",
+    "    cp = Counter(PRED)\n",
+    "    precisions = precision_score(TRUE, PRED, average=None)\n",
+    "    recalls = recall_score(TRUE, PRED, average=None)\n",
+    "    f1s = f1_score(TRUE, PRED, average=None)\n",
+    "    #for v, p, r, f in sorted(zip(values, precisions, recalls, f1s), key=lambda x: -x[3]):\n",
+    "    #    if v.endswith('formarzecz') or v.endswith('formaczas'):\n",
+    "    #        spine = ' $\\\\rightarrow$ '.join(f'\\\\nt{{{n}}}' for n in v.split('_'))\n",
+    "    #        print(f'{spine} & {100 * p:.2f}\\\\% & {100 * r:.2f}\\\\% & {100 * f:.2f}\\\\% \\\\\\\\')\n",
+    "    \n",
+    "    ct_pre, cp_pre = Counter(), Counter()\n",
+    "    for val in values:\n",
+    "        pre = val.split('_')[-1]\n",
+    "        ct_pre[pre] += ct[val]\n",
+    "        cp_pre[pre] += cp[val]\n",
+    "    \n",
+    "    rows = []\n",
+    "    \n",
+    "    for pre in ct_pre.keys():\n",
+    "        # TODO\n",
+    "        if pre == 'ign':\n",
+    "            continue\n",
+    "        if not cp_pre[pre] * ct_pre[pre]:\n",
+    "            print('SKIPPING:', pre)\n",
+    "            continue\n",
+    "        P, R = 0, 0\n",
+    "        rws = []\n",
+    "        for v, p, r, f in sorted(zip(values, precisions, recalls, f1s), key=lambda x: -x[3]):\n",
+    "            if v.endswith(pre):\n",
+    "                if pre in ('N', 'V',):\n",
+    "                    spine = ' $\\\\rightarrow$ '.join(f'\\\\nt{{{n}}}' for n in v.split('_'))\n",
+    "                    rws.append(f'{spine} & {100 * p:.2f}\\\\% & {100 * r:.2f}\\\\% & {100 * f:.2f}\\\\% & {ct[v]} \\\\\\\\')\n",
+    "                wp, wr = cp[v] / cp_pre[pre], ct[v] / ct_pre[pre]\n",
+    "                #print(f'    {v:36s} {100 * p:6.2f} {wp:7.3f} {100 * r:6.2f} {wr:7.3f}')\n",
+    "                P += p * wp\n",
+    "                R += r * wr\n",
+    "        F = 2 * P * R / (P + R)\n",
+    "        if pre in ('N', 'V',):\n",
+    "            rws.append('\\\\midrule')\n",
+    "        spine = f'... $\\\\rightarrow$ \\\\nt{{{pre}}}'\n",
+    "        rws = [f'{spine} & {100 * P:6.2f}\\\\% & {100 * R:6.2f}\\\\% & {100 * F:6.2f}\\\\% & {ct_pre[pre]} \\\\\\\\', '\\\\midrule'] + rws\n",
+    "        rows.append([-F, rws])\n",
+    "    \n",
+    "    for _, rws in sorted(rows):\n",
+    "        for r in rws:\n",
+    "            print(r)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "79a535ee",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [],
+   "source": [
+    "evaluate_spines(TAGS_VAL, TAGS_P_VAL)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "ff572777",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "evaluate_spines(TAGS_TEST, TAGS_P_TEST)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "a7784f94",
+   "metadata": {},
+   "source": [
+    "pdbc_hybrid2: cały path (łącznie z powtórzeniami) + który <anchor> od dołu:\n",
+    "\n",
+    "P: 0.9554150435214833\n",
+    "R: 0.952102292362631\n",
+    "F1: 0.9537557913442842"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "TF_zajecia",
+   "language": "python",
+   "name": "tf_zajecia"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.6"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git b/neural_parser/MultiTarget.py a/neural_parser/MultiTarget.py
new file mode 100644
index 0000000..79d7553
--- /dev/null
+++ a/neural_parser/MultiTarget.py
@@ -0,0 +1,89 @@
+import tensorflow as tf
+
+from transformers import TFBertPreTrainedModel, BertConfig, TFBertMainLayer
+from transformers.modeling_tf_utils import get_initializer, input_processing, TFTokenClassificationLoss
+
+class TFBertForMultiTargetTokenClassification(TFBertPreTrainedModel, TFTokenClassificationLoss):
+    """BERT encoder topped with one token-classification head per category.
+
+    A single ``TFBertMainLayer`` (built without the pooling layer) feeds a
+    dropout layer whose output is passed to a separate ``Dense`` layer for
+    every entry of ``categories``.  ``call`` returns the logits of all heads
+    as a dict keyed by category.
+    """
+
+    # names with a '.' represent the authorized unexpected/missing layers when a TF model is loaded from a PT model
+    _keys_to_ignore_on_load_unexpected = [
+        r"pooler",
+        r"mlm___cls",
+        r"nsp___cls",
+        r"cls.predictions",
+        r"cls.seq_relationship",
+    ]
+    _keys_to_ignore_on_load_missing = [r"dropout"]
+
+    def __init__(self, config: BertConfig, *inputs, **kwargs):
+        """Create the encoder, the dropout layer and the classification heads.
+
+        Two extra keyword arguments are required; both are removed from
+        ``kwargs`` before the parent constructor is invoked:
+
+        * ``categories`` -- sequence of category names, one head per name;
+        * ``labels`` -- mapping indexed by category name; ``len(labels[cat])``
+          is the number of output units of that category's head.
+        """
+        categories = kwargs.pop('categories')
+        labels = kwargs.pop('labels')
+
+        super().__init__(config, *inputs, **kwargs)
+
+        self.categories = categories
+        self.bert = TFBertMainLayer(config, add_pooling_layer=False, name="bert")
+
+        # Use the classifier-specific dropout rate when configured, otherwise
+        # fall back to the generic hidden dropout probability.
+        if config.classifier_dropout is not None:
+            dropout_rate = config.classifier_dropout
+        else:
+            dropout_rate = config.hidden_dropout_prob
+        self.dropout = tf.keras.layers.Dropout(rate=dropout_rate)
+
+        # One Dense head per category, named after the category.
+        heads = []
+        for cat in self.categories:
+            head = tf.keras.layers.Dense(
+                units=len(labels[cat]),
+                kernel_initializer=get_initializer(config.initializer_range),
+                name=f'classifier_{cat}',
+            )
+            heads.append(head)
+        self.classifiers = heads
+        print(f'created {len(self.classifiers)} classifier(s)')
+
+    def call(
+        self,
+        input_ids=None,
+        attention_mask=None,
+        token_type_ids=None,
+        position_ids=None,
+        head_mask=None,
+        inputs_embeds=None,
+        output_attentions=None,
+        output_hidden_states=None,
+        return_dict=None,
+        labels=None,
+        training=False,
+        **kwargs,
+    ):
+        """Run the encoder and every head; return ``{category: logits}``.
+
+        All arguments are normalised by ``input_processing`` and then
+        forwarded to the BERT main layer.  ``labels`` is only handed to
+        ``input_processing``: it is not passed to the encoder and no loss is
+        computed in this method.
+        """
+        processed = input_processing(
+            func=self.call,
+            config=self.config,
+            input_ids=input_ids,
+            attention_mask=attention_mask,
+            token_type_ids=token_type_ids,
+            position_ids=position_ids,
+            head_mask=head_mask,
+            inputs_embeds=inputs_embeds,
+            output_attentions=output_attentions,
+            output_hidden_states=output_hidden_states,
+            return_dict=return_dict,
+            labels=labels,
+            training=training,
+            kwargs_call=kwargs,
+        )
+        encoder_outputs = self.bert(
+            input_ids=processed["input_ids"],
+            attention_mask=processed["attention_mask"],
+            token_type_ids=processed["token_type_ids"],
+            position_ids=processed["position_ids"],
+            head_mask=processed["head_mask"],
+            inputs_embeds=processed["inputs_embeds"],
+            output_attentions=processed["output_attentions"],
+            output_hidden_states=processed["output_hidden_states"],
+            return_dict=processed["return_dict"],
+            training=processed["training"],
+        )
+        # The first element of the encoder output is what the heads consume,
+        # after dropout.
+        hidden = self.dropout(inputs=encoder_outputs[0], training=processed["training"])
+        per_head_logits = [head(inputs=hidden) for head in self.classifiers]
+        return dict(zip(self.categories, per_head_logits))
+
+    def serving_output(self, output):
+        """Return ``output`` unchanged."""
+        return output
diff --git b/neural_parser/constants.py a/neural_parser/constants.py
new file mode 100644
index 0000000..a4ab88d
--- /dev/null
+++ a/neural_parser/constants.py
@@ -0,0 +1,15 @@
+# NOTE(review): presumably the label id that marks positions to be ignored
+# (e.g. by the loss); its consumers are not visible in this module - confirm.
+MASK_VALUE = -100
+
+# NOTE(review): 'first' / 'last' selector names; their consumers are not
+# visible in this module - confirm what they select.
+FIRST = 'first'
+LAST = 'last'
+
+# Placeholder string for an empty value.
+# NOTE(review): exact usage to be confirmed against the callers.
+EMPTY = '<EMPTY>'
+
+# Names of the per-token annotation layers.  SPINES, ANCHORS and ANCHOR_HS
+# are the categories predicted by ConstituencyParser.
+TOKENS = 'tokens'
+LEMMAS = 'lemmas'
+TAGS = 'tags'
+SPINES = 'spines'
+ANCHORS = 'anchors'
+ANCHOR_HS = 'anchor_hs'
+HEADS = 'heads'
+DEPRELS = 'deprels'
diff --git b/neural_parser/constituency_parser.py a/neural_parser/constituency_parser.py
new file mode 100644
index 0000000..a73efe4
--- /dev/null
+++ a/neural_parser/constituency_parser.py
@@ -0,0 +1,139 @@
+import json
+
+import morfeusz2
+
+import tensorflow as tf
+from transformers import AutoTokenizer
+
+from datasets.features import ClassLabel, Sequence
+
+from .data_utils import dict_to_tensors
+from .dataset_utils import masked_word_ids
+from .MultiTarget import TFBertForMultiTargetTokenClassification
+
+from .constants import (
+    SPINES,
+    ANCHORS,
+    ANCHOR_HS,
+)
+
+def maybe_int(s):
+    """Convert ``s`` to ``int`` when it is a plain decimal integer literal.
+
+    ``s`` is converted when it consists solely of decimal digits, optionally
+    preceded by a single ``'-'``.  Anything else (the empty string, a lone
+    ``'-'``, ``'+5'``, ``'1.5'``, ...) is returned unchanged.
+
+    ``str.isdecimal`` is used rather than ``str.isdigit``: the latter also
+    accepts characters such as ``'²'`` which ``int()`` rejects with a
+    ``ValueError``.
+    """
+    if not s:
+        return s
+    digits = s[1:] if s[0] == '-' else s
+    return int(s) if digits.isdecimal() else s
+
+def keys_hook(d):
+    """Return a copy of ``d`` whose keys have been passed through ``maybe_int``.
+
+    Used as the ``object_hook`` when ``ConstituencyParser.load`` reads
+    ``config.json``, so integer-looking string keys become ``int`` again.
+    """
+    converted = {}
+    for key, value in d.items():
+        converted[maybe_int(key)] = value
+    return converted
+
+def get_labels(features, categories):
+    """Collect the class-label names of every categorical feature.
+
+    For each name in ``categories`` the inner ``.feature`` of
+    ``features[cat]`` is inspected; when it is a ``ClassLabel`` its ``names``
+    are stored under that category.  Categories whose inner feature is of
+    another type are left out of the result.
+
+    Returns:
+        dict mapping category name -> ``ClassLabel.names``.
+    """
+    return {
+        cat: features[cat].feature.names
+        for cat in categories
+        # isinstance (not an exact type match) so ClassLabel subclasses count too
+        if isinstance(features[cat].feature, ClassLabel)
+    }
+
+class ConstituencyParser(object):
+    
+    def __init__(
+            self,
+            bert_path,
+            model,
+            labels,
+            bert_tokenizer=None,
+            ):
+        """Bundle a model with its tokenizer and label inventory.
+
+        Args:
+            bert_path: path/identifier handed to ``AutoTokenizer.from_pretrained``
+                when no tokenizer is supplied; also written to the config by ``save``.
+            model: the model whose ``predict`` is called by ``parse``.
+            labels: per-category label inventory, indexed as ``labels[cat][i]``
+                by ``parse``.
+            bert_tokenizer: ready-made tokenizer; when ``None`` one is loaded
+                from ``bert_path``.
+        """
+        self.bert_path = bert_path
+        self.model = model
+        self.categories = [SPINES, ANCHORS, ANCHOR_HS]
+        self.labels = labels
+        # Only load a tokenizer when the caller did not bring one.
+        self.bert_tokenizer = (
+            AutoTokenizer.from_pretrained(bert_path)
+            if bert_tokenizer is None
+            else bert_tokenizer
+        )
+        self.morfeusz = morfeusz2.Morfeusz(generate=False, expand_tags=True)
+    
+    def save(self, path):
+        """Write the model and a small JSON config under ``path``.
+
+        The model goes to ``{path}/model`` via ``save_pretrained``; the label
+        inventory and ``bert_path`` go to ``{path}/config.json``.
+        """
+        self.model.save_pretrained(f'{path}/model')
+        config = {
+            'labels' : self.labels,
+            'bert_path' : self.bert_path,
+        }
+        # ensure_ascii=False emits non-ASCII characters verbatim, so the file
+        # encoding is pinned to UTF-8 instead of relying on the locale default
+        # (load() reads the file back with the same encoding).
+        with open(f'{path}/config.json', 'w', encoding='utf-8') as f:
+            json.dump(config, f, ensure_ascii=False)
+
+    @staticmethod
+    def create(
+            bert_path,
+            features,
+            bert_tokenizer=None,
+            ):
+        """Build a new parser on top of the checkpoint at ``bert_path``.
+
+        The label inventory is derived from ``features`` with ``get_labels``
+        and the model is instantiated with ``from_pt=True``.
+
+        Declared as a static method: it takes no ``self``, so without the
+        decorator a call through an instance would bind the instance to
+        ``bert_path``.
+
+        Args:
+            bert_path: checkpoint path/identifier for the model (and for the
+                tokenizer when ``bert_tokenizer`` is ``None``).
+            features: dataset features; ``features[cat].feature`` is read for
+                each predicted category.
+            bert_tokenizer: optional ready-made tokenizer.
+
+        Returns:
+            A new ``ConstituencyParser``.
+        """
+        categories = [SPINES, ANCHORS, ANCHOR_HS]
+        labels = get_labels(features, categories)
+        model = TFBertForMultiTargetTokenClassification.from_pretrained(
+            bert_path,
+            from_pt=True,
+            categories=categories,
+            labels=labels,
+        )
+        return ConstituencyParser(
+            bert_path,
+            model,
+            labels,
+            bert_tokenizer=bert_tokenizer
+        )
+
+    @staticmethod
+    def load(path):
+        """Restore a parser previously written by ``save``.
+
+        Reads ``{path}/config.json`` (UTF-8, keys passed through
+        ``keys_hook``) and loads the model from ``{path}/model``.  The
+        tokenizer is re-created from the stored ``bert_path``.
+
+        Declared as a static method for the same reason as ``create``.
+        """
+        with open(f'{path}/config.json', encoding='utf-8') as f:
+            config = json.load(f, object_hook=keys_hook)
+        labels = config['labels']
+        bert_path = config['bert_path']
+        categories = [SPINES, ANCHORS, ANCHOR_HS]
+        model = TFBertForMultiTargetTokenClassification.from_pretrained(
+            f'{path}/model',
+            categories=categories,
+            labels=labels,
+        )
+        return ConstituencyParser(
+            bert_path,
+            model,
+            labels,
+        )
+    
+    def align_with_mask(self, labels, mask):
+        return [
+            lbl if not hasattr(lbl, '__iter__') or type(lbl) == str else self.align_with_mask(lbl, mask)
+            for lbl, m in zip(labels, mask) if m is not None
+        ]
+    
+    def parse(self, sentences, force_long=False):
+        
+        if isinstance(sentences, str):
+            sentences = [sentences]
+        tokens = [s.split() for s in sentences]
+        tokenized = self.bert_tokenizer(
+            tokens,
+            is_split_into_words=True,
+            return_offsets_mapping=True,
+            padding=True,
+        )
+        
+        M = len(tokenized['input_ids'][0])
+        if M > self.bert_tokenizer.model_max_length and not force_long:
+            raise RuntimeError(f'Bert tokenizer produced a sequence of {M} tokens which exceeds the model’s limit ({self.bert_tokenizer.model_max_length}). Parse shorter sentences or call parse with force_long=True at your own risk.')
+        x = dict_to_tensors(dict(tokenized))
+        
+        predicted = self.model.predict(x)
+        labels = dict()
+        for cat, pred in predicted.items():
+            label_ids = tf.argmax(pred, axis=-1).numpy()
+            lbls = [[self.labels[cat][i] for i in l_ids] for l_ids in label_ids]
+            labels[cat] = lbls
+        
+        trees = []
+        
+        for i, (tkns, sentence) in enumerate(zip(tokens, sentences)):
+            
+            mask = masked_word_ids(tokenized.word_ids(i))
+            lbls = {cat : self.align_with_mask(lbls[i], mask) for cat, lbls in labels.items()}
+            trees.append((tkns, lbls))
+        
+        return trees
diff --git b/neural_parser/data_utils.py a/neural_parser/data_utils.py
new file mode 100644
index 0000000..6452ab0
--- /dev/null
+++ a/neural_parser/data_utils.py
@@ -0,0 +1,41 @@
+from collections import defaultdict
+from itertools import chain
+
+import numpy as np
+import tensorflow as tf
+
+from datasets.features import ClassLabel
+
+from .constants import MASK_VALUE
+
+# based on transformers.data.data_collator.DataCollatorForTokenClassification
+class DataCollator(object):
+    """Pads a batch of tokenized examples together with their label columns.
+
+    ``features`` maps each label column to its dataset feature; only
+    sequences of ``ClassLabel`` are supported.
+    """
+
+    def __init__(self, tokenizer, features):
+        self.features = features
+        self.tokenizer = tokenizer
+
+    def _pad_labels(self, labels, sequence_length):
+        """Extend ``labels`` to ``sequence_length`` with ``MASK_VALUE``,
+        on the side on which the tokenizer pads."""
+        filler = [MASK_VALUE] * (sequence_length - len(labels))
+        if self.tokenizer.padding_side != 'right':
+            return filler + list(labels)
+        return list(labels) + filler
+
+    def __call__(self, instance):
+        """Pad the inputs with the tokenizer, pad the labels to the same
+        length and return everything as a dict of tensors."""
+        batch = self.tokenizer.pad(instance, padding=True)
+        sequence_length = tf.convert_to_tensor(batch['input_ids']).shape[1]
+        for category, feat in self.features.items():
+            if type(feat.feature) != ClassLabel:
+                raise ValueError(f'Unsupported feature type {type(feat.feature)} for "{category}".')
+            batch[category] = [
+                self._pad_labels(lbl, sequence_length) for lbl in batch[category]
+            ]
+        return {k: tf.convert_to_tensor(v) for k, v in batch.items()}
+
+def dict_to_tensors(d):
+    """Return a new dict with every value of ``d`` converted to a tensor."""
+    tensors = {}
+    for key, value in d.items():
+        tensors[key] = tf.convert_to_tensor(value)
+    return tensors
diff --git b/neural_parser/dataset_utils.py a/neural_parser/dataset_utils.py
new file mode 100644
index 0000000..8917060
--- /dev/null
+++ a/neural_parser/dataset_utils.py
@@ -0,0 +1,138 @@
+from collections import Counter, defaultdict
+from itertools import chain
+
+from datasets import ClassLabel, Sequence
+
+from .hybrid_tree_utils import tree_from_dataset_instance
+
+from .constants import (
+    FIRST,
+    LAST,
+    MASK_VALUE,
+    EMPTY,
+    TOKENS,
+    SPINES,
+    ANCHORS,
+    ANCHOR_HS,
+)
+
+def _do_collect_spines(tree):
+    """Split the subtree rooted in ``tree`` into head paths.
+
+    Returns ``(spine, attachments)``: ``spine`` is the list of nodes obtained
+    by following head children from ``tree`` down to a leaf; ``attachments``
+    holds one ``(anchor category, h, spine)`` triple for every spine hanging
+    off a node of this subtree.
+    """
+    if not tree.children:
+        return [tree], []
+    head_children = [c for c in tree.children if c.is_head]
+    assert(len(head_children) == 1)
+    head_child = head_children[0]
+    spine = [tree]
+    attachments = []
+    dependent_spines = []
+    for child in tree.children:
+        child_spine, nested = _do_collect_spines(child)
+        attachments.extend(nested)
+        if child == head_child:
+            spine.extend(child_spine)
+        else:
+            dependent_spines.append(child_spine)
+    if dependent_spines:
+        # h == which <tree.category> counting from the bottom is the anchor
+        h = [node.category for node in spine].count(tree.category)
+        attachments.extend((tree.category, h, dep) for dep in dependent_spines)
+    return spine, attachments
+
+def _collect_spines(tree):
+    """Map every leaf to ``(anchor category, h, spine above the leaf)``.
+
+    The spine starting in the root is recorded with the pseudo-anchor
+    ``'<ROOT>'``. If collecting fails, the tree is printed in bracket
+    notation before the error is re-raised.
+    """
+    try:
+        root_spine, attachments = _do_collect_spines(tree)
+    except BaseException:
+        print(tree.to_brackets())
+        raise
+    by_leaf = {}
+    for anchor, h, spine in [('<ROOT>', '<ROOT>', root_spine)] + attachments:
+        by_leaf[spine[-1]] = (anchor, h, spine[:-1])
+    return by_leaf
+
+def _compress_spine(spine):
+    """Collapse runs of a repeated category into a single occurrence.
+
+    A category may only repeat directly after itself; a repetition further
+    apart trips the assertion.
+    """
+    result = []
+    for category in spine:
+        if category not in result:
+            result.append(category)
+            continue
+        assert(category == result[-1])
+    return result
+
+def _add_spines_and_attachments(instance, dataset_features, compress):
+    """Compute the per-token spine, anchor and anchor height columns.
+
+    The tree is rebuilt from ``instance``; for each leaf, in linear order,
+    the spine is written as its categories joined with ``_`` (``EMPTY`` when
+    there are none), optionally compressed, and the anchor height is
+    stringified.
+    """
+    tree = tree_from_dataset_instance(instance, dataset_features)
+    spine_info = _collect_spines(tree)
+    spines, anchors, anchor_hs = [], [], []
+    for leaf in sorted(tree.get_yield(), key=lambda leaf: leaf.from_index):
+        anchor, anchor_h, spine_nodes = spine_info[leaf]
+        categories = [node.category for node in spine_nodes]
+        if compress:
+            categories = _compress_spine(categories)
+        spines.append('_'.join(categories) if categories else EMPTY)
+        anchors.append(anchor)
+        anchor_hs.append(str(anchor_h))
+    return {
+        SPINES : tuple(spines),
+        ANCHORS : tuple(anchors),
+        ANCHOR_HS : tuple(anchor_hs),
+    }
+
+def cast_labels(dataset, columns):
+    """Cast ``columns`` to sequences of ``ClassLabel``.
+
+    The label names of a column are the sorted set of values seen in that
+    column across all splits of ``dataset``.
+    """
+    seen = defaultdict(Counter)
+    for split in dataset.values():
+        for column in columns:
+            column_counts = seen[column]
+            for example in split:
+                column_counts.update(example[column])
+    features = dataset['train'].features.copy()
+    for column in columns:
+        names = sorted(seen[column])
+        features[column] = Sequence(ClassLabel(names=names))
+    return dataset.cast(features)
+
+def add_spines_and_attachments(dataset, compress=False):
+    """Add the spine/anchor columns to every split and cast them to class labels."""
+    dataset_features = dataset['train'].features
+
+    def annotate(instance):
+        return _add_spines_and_attachments(instance, dataset_features, compress=compress)
+
+    annotated = dataset.map(annotate)
+    return cast_labels(annotated, [SPINES, ANCHORS, ANCHOR_HS])
+
+# https://huggingface.co/docs/transformers/v4.23.1/en/tasks/token_classification
+
+def masked_word_ids(word_ids, masking_strategy=FIRST):
+    """Keep the word id on one sub-token per word and mask the others.
+
+    word_ids         -- one entry per sub-token: the index of the word it
+                        belongs to, or ``None`` for special tokens
+    masking_strategy -- ``FIRST`` keeps the id on the first sub-token of
+                        each word, ``LAST`` on the last one
+
+    Returns a list as long as ``word_ids`` with ``None`` at every masked
+    position. Raises RuntimeError for an unknown strategy (previously such a
+    call silently returned a list with entries missing).
+    """
+    if masking_strategy not in (FIRST, LAST):
+        raise RuntimeError(f'Unknown masking strategy: {masking_strategy}')
+    last_position = len(word_ids) - 1
+    masked = []
+    for i, word_idx in enumerate(word_ids):
+        # Mask the label for:
+        #   * special tokens (word id = None)
+        #   * other tokens in a word
+        if word_idx is None:
+            masked.append(None)
+            continue
+        # Sequence boundaries count as "a different word": without the bounds
+        # checks, i - 1 wraps around to the last element at i == 0 and
+        # i + 1 runs past the end at the last position.
+        if masking_strategy == FIRST:
+            neighbour = word_ids[i - 1] if i > 0 else None
+        else:
+            neighbour = word_ids[i + 1] if i < last_position else None
+        masked.append(word_idx if word_idx != neighbour else None)
+    return masked
+
+def _align_row(values, masked_word_ids):
+    """Pick ``values[idx]`` for every word id, ``MASK_VALUE`` for every ``None``."""
+    aligned = []
+    for idx in masked_word_ids:
+        aligned.append(values[idx] if idx is not None else MASK_VALUE)
+    return aligned
+
+def _align_example(example, masked_ids):
+    """Align the label columns of ``example`` with the sub-token sequence.
+
+    Only the ``SPINES``, ``ANCHORS`` and ``ANCHOR_HS`` columns are processed;
+    each is expanded with ``_align_row`` so that it has one entry per
+    element of ``masked_ids``. Returns a ``defaultdict(list)`` keyed by
+    column name.
+    """
+    labels = defaultdict(list)
+    for column_name in example.keys():
+        if column_name in (SPINES, ANCHORS, ANCHOR_HS):
+            labels[column_name] = _align_row(example[column_name], masked_ids)
+    return labels
+
+def bert_tokenize_and_align(example, tokenizer, masking_strategy=FIRST):
+    """Tokenize the words of ``example`` and attach sub-token aligned labels.
+
+    Returns the tokenizer output extended with the aligned label columns.
+    Raises RuntimeError when ``masking_strategy`` is neither ``FIRST`` nor
+    ``LAST``.
+    """
+    if masking_strategy in (FIRST, LAST):
+        encoding = tokenizer(example[TOKENS], truncation=True, is_split_into_words=True)
+        mask = masked_word_ids(encoding.word_ids(), masking_strategy)
+        encoding.update(_align_example(example, mask))
+        return encoding
+    raise RuntimeError(f'Uknown masking strategy: {masking_strategy}')
diff --git b/neural_parser/hybrid_tree_utils.py a/neural_parser/hybrid_tree_utils.py
new file mode 100644
index 0000000..4b88bcb
--- /dev/null
+++ a/neural_parser/hybrid_tree_utils.py
@@ -0,0 +1,335 @@
+from collections import defaultdict
+from itertools import chain
+
+from .constants import (
+    EMPTY,
+    TOKENS,
+    LEMMAS,
+    TAGS,
+    SPINES,
+    ANCHORS,
+    ANCHOR_HS,
+    HEADS,
+    DEPRELS,
+)
+
+class TreeNode(object):
+    """A node of a headed constituency tree.
+
+    ``category`` is a string for nonterminals and an ``(orth, lemma, tag)``
+    tuple for terminals; ``from_index``/``to_index`` delimit the covered
+    token span. Children passed to the constructor or to ``add_child`` get
+    their ``parent`` set to this node.
+    """
+
+    def __init__(self, nid, category, is_head, from_index, to_index, head_index=None, deprel=None, attributes=None, children=None):
+        self.nid = nid
+        self.parent = None
+        self.category = category
+        self.is_head = is_head
+        self.from_index = from_index
+        self.to_index = to_index
+        self.head_index = head_index
+        self.deprel = deprel
+        self.attributes = attributes if attributes is not None else {}
+        self.children = children if children is not None else []
+        for child in self.children:
+            child.parent = self
+
+    def add_child(self, child):
+        """Append ``child`` and make this node its parent."""
+        self.children.append(child)
+        child.parent = self
+
+    def get_yield(self):
+        """Return the leaves below this node, in child order."""
+        if not self.children:
+            return [self]
+        return list(chain.from_iterable(child.get_yield() for child in self.children))
+
+    def is_continuous(self):
+        """Tell whether the leaves' ``from_index`` values are in ascending order."""
+        idx = [token.from_index for token in self.get_yield()]
+        return (idx == sorted(idx))
+
+    def get_root(self):
+        """Follow ``parent`` links up to the node that has none."""
+        root = self
+        while root.parent is not None:
+            root = root.parent
+        return root
+
+    def get_head_child(self):
+        """Return the single child marked as head, or ``None`` for a leaf."""
+        if self.children:
+            heads = [child for child in self.children if child.is_head]
+            assert(len(heads) == 1)
+            return heads[0]
+        return None
+
+    def get_head_token(self):
+        """Return the leaf reached by following head children from this node."""
+        node = self
+        while node.children:
+            node = node.get_head_child()
+        return node
+
+    def make_evalb_friendly(self, s):
+        """Replace spaces and parentheses, which would break bracket notation."""
+        return s.replace(' ', '_').replace('(', 'LPAR').replace(')', 'RPAR')
+
+    def to_brackets(self, features=(), mark_head=True, mark_head_terminals=False, morph_tags=False, dummy_pre=False):
+        """Render the subtree in bracket notation.
+
+        features            -- attribute names appended to nonterminal
+                               categories (``EMPTY`` when a node lacks one)
+        mark_head           -- prefix head nonterminals with ``*``
+        mark_head_terminals -- not implemented; raises NotImplementedError
+        morph_tags          -- wrap each terminal as ``(tag orth)``
+        dummy_pre           -- wrap terminals that have siblings in a
+                               ``DUMMY_PRE`` preterminal
+        """
+        if mark_head_terminals:
+            raise NotImplementedError
+        if not self.children:
+            cat = self.make_evalb_friendly(self.category[0])
+            if morph_tags:
+                cat = f'({self.category[2]} {cat})'
+            # a leaf without a parent has no siblings either
+            if not dummy_pre or self.parent is None or len(self.parent.children) == 1:
+                return cat
+            return f'(DUMMY_PRE {cat})'
+        cat = '_'.join([self.category] + [self.attributes.get(f, EMPTY) for f in features])
+        if mark_head and self.is_head:
+            cat = '*' + cat
+        cat = self.make_evalb_friendly(cat)
+        return f'({cat} {" ".join(child.to_brackets(features=features, mark_head=mark_head, mark_head_terminals=mark_head_terminals, morph_tags=morph_tags, dummy_pre=dummy_pre) for child in self.children)})'
+
+    def pretty_print(self, tab='', features=()):
+        """Print the subtree, one node per line, indented by depth."""
+        print(f'{tab}[{self.nid}] {"*" if self.is_head else ""}{self.category}{[self.attributes.get(f, EMPTY) for f in features]}')
+        for child in self.children:
+            child.pretty_print(tab=tab + '    ', features=features)
+
+def _do_mark_heads(tree, dependency_heads):
+    """Mark head children below ``tree`` and return its lexical head index.
+
+    A child is the head when the dependency head of its own lexical head
+    is not the lexical head of any sibling (or of the child itself).
+    Exactly one child must qualify.
+    """
+    if not tree.children:
+        return tree.from_index
+    lexical_heads = [_do_mark_heads(child, dependency_heads) for child in tree.children]
+    found = []
+    for child, token_idx in zip(tree.children, lexical_heads):
+        governor = dependency_heads[token_idx]
+        if governor in lexical_heads:
+            continue
+        child.is_head = True
+        found.append(token_idx)
+    assert(len(found) == 1)
+    return found[0]
+
+def _mark_heads(tree, dependency_heads):
+    """Set ``is_head`` on the nodes of ``tree`` according to ``dependency_heads``."""
+    # only the marking side effect is wanted; the lexical head index of the
+    # root is discarded
+    _ = _do_mark_heads(tree, dependency_heads)
+    return None
+
+def _rearrange(tree):
+    """Sort children by ``from_index`` throughout the tree, bottom-up.
+
+    Every inner node's span is recomputed: it starts where its first
+    child starts and ends at the largest ``to_index`` among its children.
+    The (mutated) ``tree`` is returned.
+    """
+    if not tree.children:
+        return tree
+    ordered = [_rearrange(child) for child in tree.children]
+    ordered.sort(key=lambda node: node.from_index)
+    tree.children = ordered
+    tree.from_index = ordered[0].from_index
+    tree.to_index = max(node.to_index for node in ordered)
+    return tree
+
+def tree_from_dataset_instance(instance, dataset_features):
+    """Build a ``TreeNode`` tree from one dataset instance.
+
+    Entries of ``instance['nonterminals']`` without a category stand for
+    terminals: they have exactly one child, the index of their token. The
+    first entry is taken as the root. Heads are marked from
+    ``instance['heads']`` and the children are put in linear order.
+    """
+    nonterminals = instance['nonterminals']
+    nodes = []
+
+    # one node per entry; spans of nonterminals are filled in by _rearrange
+    for nid, nonterminal in enumerate(nonterminals):
+        category = nonterminal['cat']
+        if category is not None:
+            nodes.append(TreeNode(nid, category, False, 0, 0))
+            continue
+        assert(len(nonterminal['children']) == 1)
+        token_idx = nonterminal['children'][0]
+        orth = instance[TOKENS][token_idx]
+        lemma = instance[LEMMAS][token_idx]
+        tag = dataset_features[TAGS].feature.int2str(instance[TAGS][token_idx])
+        nodes.append(TreeNode(nid, (orth, lemma, tag), False, token_idx, token_idx + 1))
+
+    # attach the children of every real nonterminal
+    for nonterminal, node in zip(nonterminals, nodes):
+        if nonterminal['cat'] is None:
+            continue
+        for child_idx in nonterminal['children']:
+            node.add_child(nodes[child_idx])
+
+    root = nodes[0]
+    # mark the heads according to dependency relations
+    _mark_heads(root, instance['heads'])
+
+    return _rearrange(root)
+
+def get_heads(matrix):
+    """Decode a list of head indices, ordered by dependent, from ``matrix``.
+
+    Edges returned by ``mst`` are ``(head, dependent)`` pairs; both are
+    shifted down by one, and edges whose dependent is 0 are dropped.
+
+    NOTE(review): ``normalize``, ``add_root`` and ``mst`` are neither defined
+    nor imported in this module -- confirm where they are expected to come
+    from.
+    """
+    chart = add_root(normalize(matrix))
+    head_of = {}
+    for hd, dep in mst(chart):
+        if dep > 0:
+            head_of[dep - 1] = hd - 1
+    return [head_of[dep] for dep in sorted(head_of)]
+
+def make_head_path(path, token, lemma, tag, index):
+    """Build the chain of nodes described by the spine string ``path``.
+
+    The terminal for ``(token, lemma, tag)`` sits at the bottom; the
+    ``_``-separated categories of ``path`` are stacked above it, the first
+    one on top, each lower node being the head child of the one above.
+    For ``EMPTY`` the bare terminal is returned.
+    """
+    node = TreeNode(0, (token, lemma, tag), False, index, index + 1)
+    if path != EMPTY:
+        categories = path.split('_')
+        while categories:
+            node.is_head = True
+            node = TreeNode(0, categories.pop(), False, None, None, children=[node])
+    return node
+
+def append_dependent(head_path, dep_path, anchor_cat, anchor_h, decompress=False):
+    """Attach ``dep_path`` to a node on the head chain of ``head_path``.
+
+    The anchor is the ``anchor_h``-th node of category ``anchor_cat``
+    counting from the bottom of the head chain. When no node of that
+    category exists, the dependent is attached to the top of ``head_path``
+    and the mismatch is reported.
+
+    Returns ``(head_path, problem)``: ``head_path`` may be a new top node if
+    the chain was extended upwards; ``problem`` is ``None`` or
+    ``(dep_path, anchor_cat)``.
+    """
+    problem = None
+    anchor_node = head_path
+    # collect the head chain: head_path, its head child, that child's head child, ...
+    head_chain = [head_path]
+    while head_chain[-1].children:
+        heads = [child for child in head_chain[-1].children if child.is_head]
+        try:
+            assert len(heads) == 1
+            head_chain.append(heads[0])
+        except:
+            # dump the offending structure before propagating the error
+            head_path.pretty_print()
+            head_chain[-1].pretty_print()
+            raise
+    # candidates, ordered from the top of the chain to the bottom
+    matching_heads = [hd for hd in head_chain if hd.category == anchor_cat]
+    if not matching_heads:
+        anchor_node = head_path
+        problem = (dep_path, anchor_cat)
+    else:
+        # fallback: take the highest
+        if anchor_h is None:
+            anchor_h = len(matching_heads)
+        elif anchor_h > len(matching_heads) and not decompress:
+            anchor_h = len(matching_heads)
+        elif anchor_h > len(matching_heads) and decompress:
+            # the chain has too few nodes of this category: insert copies
+            # above the topmost matching node until there are anchor_h of them
+            expand = anchor_h - len(matching_heads)
+            for i in range(expand):
+                child = matching_heads[0]
+                parent = child.parent
+                # the new node inherits the head status of the node it wraps
+                new_node = TreeNode(0, anchor_cat, child.is_head, None, None, children=[child])
+                child.is_head = True
+                if parent:
+                    parent.children.remove(child)
+                    parent.add_child(new_node)
+                if head_path == child:
+                    # the wrapped node was the top of the path
+                    head_path = new_node
+                matching_heads.insert(0, new_node)
+        # negative index: anchor_h-th matching node counting from the bottom
+        anchor_node = matching_heads[-anchor_h]
+    anchor_node.add_child(dep_path)
+    dep_path.is_head = False
+    return head_path, problem
+
+# Category of the dummy preterminal to create for a terminal, keyed by the
+# part of the terminal's tag before the first ':'.
+# NOTE(review): every entry is commented out, so any lookup raises KeyError.
+POS2PRE = {
+    #'aglt' : 'aglt',
+    #'conj' : 'spójnik',
+    #'dig' : 'formalicz',
+    #'fin' : 'formaczas',
+    #'interp' : 'punct',
+    #'num' : 'formalicz',
+    #'praet' : 'formaczas',
+    #'_' : '???',
+}
+
+def add_dummy_pre(path):
+    """Wrap the terminal ``path`` in a preterminal chosen by its part of speech.
+
+    The part of speech is the part of the terminal's tag before the first
+    ``:``; the preterminal's category is looked up in ``POS2PRE`` (KeyError
+    if there is no entry). The span of the new node is left unset, as for
+    the other nonterminals built during reconstruction.
+    """
+    pos = path.category[2].split(':')[0]
+    # Keyword arguments: passed positionally, the attribute dict and the
+    # child list would land in from_index/to_index and the terminal would
+    # never be attached.
+    # NOTE(review): the terminal's own is_head flag is left untouched --
+    # confirm whether it should be marked as the head of the new node.
+    return TreeNode(0, f'{POS2PRE[pos]}', True, None, None, attributes={}, children=[path])
+
+def check_no_cycles(heads):
+    """Tell whether ``heads`` describes a forest, i.e. contains no cycle.
+
+    heads -- ``heads[i]`` is the index of the head of token ``i``; a token
+             without a head carries ``-1`` or ``None``
+
+    Returns True when every token can be reached from a root marker, False
+    otherwise (tokens on a cycle are never reached).
+    """
+    children_dict = defaultdict(set)
+    for i, hd in enumerate(heads):
+        children_dict[hd].add(i)
+    visited = set()
+    # traversal order is irrelevant, so a plain stack will do
+    pending = [-1, None]
+    while pending:
+        for child in children_dict.pop(pending.pop(), ()):
+            if child in visited:
+                return False
+            visited.add(child)
+            pending.append(child)
+    # anything not reached from a root hangs off a cycle
+    return len(visited) == len(heads)
+
+# find any <EMPTY>’s children and reattach them to <EMPTY>’s head
+def try_reattach(heads, spines, tokens):
+    """Make sure no token with an ``EMPTY`` spine is the head of another token.
+
+    As long as such a token exists, the dependents of the first one are
+    moved to that token's own head. ``heads`` itself is not modified; a
+    changed copy is returned when something was reattached, otherwise the
+    original object.
+
+    Progress is printed. The function aborts deliberately with a
+    ZeroDivisionError (``1/0``) on the 50th round or when a reattachment
+    fails the cycle check.
+    """
+    
+    # tokens with an empty spine that some other token points to as its head
+    to_reattach = [i for i, spine in enumerate(spines) if spine == EMPTY and i in heads]
+    k = 0
+    while to_reattach:
+        k += 1
+        if k == 50:
+            # safety valve against looping forever
+            1/0
+        print('------- TO REATTACH:')
+        for i in to_reattach:
+            print('    ===>', i, tokens[i], '->', [t for t, h in zip(tokens, heads) if h == i])
+        tr = to_reattach[0]
+        hd_idx = heads[tr]
+        # the token being bypassed must itself have a head
+        assert(hd_idx is not None)
+        new_heads = heads.copy()
+        for i, hd in enumerate(heads):
+            if hd == tr:
+                new_heads[i] = hd_idx
+        if check_no_cycles(new_heads):
+            heads = new_heads
+        else:
+            print('can’t reattach (cycle!)')
+            1/0
+        to_reattach = [i for i, spine in enumerate(spines) if spine == EMPTY and i in heads]
+    
+    return heads
+
+def reconstruct_tree(tokens, tags, decompress=False, root_label='ROOT'):
+    """Rebuild a constituency tree from per-token labels.
+
+    tokens     -- the words of the sentence
+    tags       -- dict with per-token lists under ``HEADS``, ``DEPRELS``,
+                  ``SPINES``, ``ANCHORS``, ``ANCHOR_HS`` and optionally
+                  ``TAGS`` and ``LEMMAS`` (``'_'`` is used when missing)
+    decompress -- passed on to ``append_dependent``
+    root_label -- category expected on top of the root token's spine only
+
+    Returns ``(tree, problems)``; ``problems`` lists the anchors that could
+    not be found plus the string ``'reattach'`` if heads had to be changed.
+    """
+    morph_tags = tags.get(TAGS, ['_' for _ in tokens])
+    lemmas = tags.get(LEMMAS, ['_' for _ in tokens])
+    heads = tags[HEADS]
+    deprels = tags[DEPRELS]
+    spines = tags[SPINES]
+    anchors = tags[ANCHORS]
+    anchor_hs = tags[ANCHOR_HS] 
+    problems = []
+    # work on a copy, the spines are corrected below
+    spines = list(spines)
+    # NOTE(review): 'children' is never used
+    children = defaultdict(set)
+    
+    # make the spines agree with the heads: the root label belongs on the
+    # spine of the headless token and nowhere else
+    for i, (head, spine) in enumerate(zip(heads, spines)):
+        if (head is None and root_label not in spine):
+            spines[i] = (f'{root_label}_' + spines[i]).replace(f'_{EMPTY}', '')
+        if (head is not None and root_label in spine):
+            assert(spines[i].startswith(root_label))
+            spines[i] = EMPTY if spines[i] == root_label else spines[i].replace(f'{root_label}_', '')
+    
+    reattach = False
+    
+    new_heads = try_reattach(heads, spines, tokens)
+    if new_heads != heads:
+        heads = new_heads
+        reattach = True
+    
+    # one head path (spine with its terminal at the bottom) per token
+    head_paths = [
+        make_head_path(p, tok, lemma, tag, i) for i, (p, tok, lemma, tag)
+        in enumerate(zip(spines, tokens, lemmas, morph_tags))
+    ]
+    
+    # if a spine is some other spine’s head and consists of a terminal only, add a dummy preterminal to append to
+    head_paths = [add_dummy_pre(hp) if (type(hp.category) == tuple and i in heads) else hp for i, hp in enumerate(head_paths)]
+    
+    # the root's anchor height is the placeholder '<ROOT>', all others are numbers
+    anchor_hs = [int(h) if h != '<ROOT>' else None for h in anchor_hs]
+    root = None
+    for i, head in enumerate(heads):
+        if deprels[i] is not None:
+            head_paths[i].attributes['deprel'] = deprels[i]
+        if head is None:
+            root = i
+        else:
+            # append_dependent may replace the top node of the head's path
+            head_paths[head], problem = append_dependent(
+                head_paths[head], head_paths[i], anchors[i], anchor_hs[i], decompress=decompress)
+            if problem:
+                problems.append(problem)
+    if reattach:
+        problems.append('reattach')
+    
+    # NOTE(review): if no head is None, root is still None here and the
+    # lookup below fails
+    tree = _rearrange(head_paths[root])
+    
+    return tree, problems
+
+def make_tree(tokens, tags, root_label, decompress=True):
+    """Reconstruct the tree for ``tokens``/``tags`` and drop the problem list."""
+    result = reconstruct_tree(tokens, tags, root_label=root_label, decompress=decompress)
+    tree, _problems = result
+    return tree
+
+def _node2dict(tree):
+    """Convert the subtree rooted in ``tree`` to nested plain dicts.
+
+    Every node gets ``is_head`` and ``span``; ``deprel`` and ``attributes``
+    are included only when set. Inner nodes carry ``category`` and
+    ``children``; leaves carry ``orth``, ``base`` and ``tag`` taken from
+    their category tuple.
+    """
+    node = {
+        'is_head' : tree.is_head,
+        'span' : {'from' : tree.from_index, 'to' : tree.to_index},
+    }
+    if tree.deprel is not None:
+        node['deprel'] = tree.deprel
+    if tree.attributes:
+        node['attributes'] = tree.attributes
+    if tree.children:
+        node['category'] = tree.category
+        node['children'] = [_node2dict(child) for child in tree.children]
+    else:
+        node.update(dict(zip(('orth', 'base', 'tag'), tree.category)))
+    return node
+
+def tree2dict(tree, metadata=None):
+    """Serialise ``tree`` to plain dicts under ``'tree'``, next to ``'metadata'``.
+
+    When ``metadata`` is omitted, a fresh empty dict is used for every call,
+    so results of different calls never share a metadata object.
+    """
+    return {
+        'tree' : _node2dict(tree),
+        'metadata' : {} if metadata is None else metadata,
+    }
diff --git b/neural_parser/training.py a/neural_parser/training.py
new file mode 100644
index 0000000..04d0201
--- /dev/null
+++ a/neural_parser/training.py
@@ -0,0 +1,180 @@
+import os
+import subprocess
+
+from itertools import chain
+
+import tensorflow as tf
+from tensorflow.keras import backend
+
+from datasets import Dataset
+from datasets.features import Features
+from transformers import AutoTokenizer
+from transformers.modeling_tf_utils import TFTokenClassificationLoss
+from transformers.tf_utils import shape_list
+
+from .constituency_parser import ConstituencyParser
+from .data_utils import DataCollator
+from .dataset_utils import bert_tokenize_and_align
+from .constants import (
+    FIRST,
+    MASK_VALUE,
+    TOKENS,
+    SPINES,
+    ANCHORS,
+    ANCHOR_HS,
+)
+
+class AvgAccuracy(tf.keras.callbacks.Callback):
+    """Adds the mean of the per-output accuracies to the epoch logs.
+
+    All log entries ending in ``_acc`` are averaged into ``avg_acc``; those
+    that also start with ``val_`` are averaged into ``val_avg_acc``.
+    """
+    def __init__(self):
+        super(AvgAccuracy, self).__init__()
+    def on_epoch_begin(self, epoch, logs=None):
+        return
+    def on_epoch_end(self, epoch, logs=None):
+        if logs is None:
+            # nowhere to store the averages
+            return
+        accs = []
+        val_accs = []
+        for k, v in logs.items():
+            if k.endswith('_acc'):
+                if k.startswith('val_'):
+                    val_accs.append(v)
+                else:
+                    accs.append(v)
+        # an average is only defined when there is something to average,
+        # e.g. there are no val_* entries without validation data
+        if accs:
+            logs['avg_acc'] = sum(accs) / len(accs)
+        if val_accs:
+            logs['val_avg_acc'] = sum(val_accs) / len(val_accs)
+
+def _masked_sparse_categorical_accuracy(y_true, y_pred):
+    """Per-position accuracy that ignores positions labelled ``MASK_VALUE``.
+
+    ``y_pred`` is reduced to class ids with an argmax over its last axis;
+    both tensors are flattened and the positions where ``y_true`` equals
+    ``MASK_VALUE`` are dropped. Returns a float tensor with 1.0 for every
+    remaining position where prediction and label agree and 0.0 elsewhere.
+    """
+    y_pred = tf.convert_to_tensor(y_pred)
+    y_true = tf.convert_to_tensor(y_true)
+    y_pred_rank = y_pred.shape.ndims
+    y_true_rank = y_true.shape.ndims
+    # If the shape of y_true is (num_samples, 1), squeeze to (num_samples,)
+    if (y_true_rank is not None) and (y_pred_rank is not None) and (len(
+            backend.int_shape(y_true)) == len(backend.int_shape(y_pred))):
+        y_true = tf.squeeze(y_true, [-1])
+    y_pred = tf.compat.v1.argmax(y_pred, axis=-1)
+    # the mask must be computed before y_true itself is filtered
+    mask = tf.reshape(y_true, (-1,)) != MASK_VALUE
+    y_true = tf.boolean_mask(tf.reshape(y_true, (-1,)), mask)
+    y_pred = tf.boolean_mask(tf.reshape(y_pred, (-1,)), mask)
+    # If the predicted output and actual output types don't match, force cast them
+    # to match.
+    if backend.dtype(y_pred) != backend.dtype(y_true):
+        y_pred = tf.cast(y_pred, backend.dtype(y_true))
+    ret = tf.cast(tf.equal(y_true, y_pred), backend.floatx())
+    return ret
+
+class Trainer(object):
+    """Fine-tunes a ``ConstituencyParser`` on a dataset with spine/anchor labels.
+
+    The dataset must provide ``train`` and ``validation`` splits carrying
+    the ``SPINES``, ``ANCHORS`` and ``ANCHOR_HS`` columns.
+    """
+
+    def __init__(
+            self,
+            bert_path,
+            dataset,
+            batch_size=32,
+            ):
+        """Load the tokenizer, tokenize the dataset and build the TF datasets."""
+        self.bert_path = bert_path
+        self.dataset = dataset
+        self.masking_strategy = FIRST
+        self.batch_size = batch_size
+
+        self.categories = [SPINES, ANCHORS, ANCHOR_HS]
+
+        self.features = Features({cat : self.dataset['train'].features[cat] for cat in self.categories})
+
+        print('Loading BERT tokenizer...')
+        self.bert_tokenizer = AutoTokenizer.from_pretrained(self.bert_path)
+
+        print('Preprocessing the dataset for BERT...')
+        self.dataset = self.dataset.map(lambda x: bert_tokenize_and_align(x, self.bert_tokenizer, self.masking_strategy))
+
+        self.train_data = self._prepare_tf_data(self.dataset['train'], shuffle=True)
+        self.dev_data = self._prepare_tf_data(self.dataset['validation'])
+
+    def _prepare_tf_data(self, dataset, shuffle=False):
+        """Turn one split into a batched ``tf.data`` dataset with padded labels."""
+        collator = DataCollator(self.bert_tokenizer, self.features)
+        return Dataset.to_tf_dataset(
+            dataset,
+            columns=['input_ids', 'token_type_ids', 'attention_mask'],
+            label_cols=self.categories,
+            batch_size=self.batch_size, shuffle=shuffle, collate_fn=collator
+        )
+
+    def _prepare_output_dir(self, path):
+        """Make sure ``path`` is an existing, empty directory.
+
+        A missing directory is created together with its parents; an
+        existing one is emptied. Raises ValueError if ``path`` exists but
+        is not a directory.
+        """
+        # Filesystem calls instead of shell command strings: they cope with
+        # spaces and shell metacharacters in the path and report failures.
+        import shutil
+        if not os.path.exists(path):
+            os.makedirs(path)
+            return
+        if not os.path.isdir(path):
+            raise ValueError(f'{path} is not a directory')
+        entries = os.listdir(path)
+        if entries:
+            print(f'emptying {path}')
+            for entry in entries:
+                entry_path = os.path.join(path, entry)
+                if os.path.isdir(entry_path) and not os.path.islink(entry_path):
+                    shutil.rmtree(entry_path)
+                else:
+                    os.remove(entry_path)
+
+    def _make_callbacks(self, log_dir):
+        """Average accuracy and early stopping on it, plus TensorBoard when
+        ``log_dir`` is given."""
+        callbacks = [
+            # must precede EarlyStopping, which monitors the value it adds
+            AvgAccuracy(),
+            tf.keras.callbacks.EarlyStopping(monitor='val_avg_acc', patience=4, verbose=1, restore_best_weights=True)
+        ]
+        if log_dir is not None:
+            callbacks.append(tf.keras.callbacks.TensorBoard(log_dir=log_dir, histogram_freq=0, update_freq=50))
+        return callbacks
+
+    def train(self, epochs=10, lr=0.00001, log_dir=None, model_dir=None):
+        """Train a new parser and return it.
+
+        epochs    -- maximal number of epochs (early stopping may end sooner)
+        lr        -- learning rate of the Adam optimizer
+        log_dir   -- directory for TensorBoard logs; emptied first
+        model_dir -- directory to save the parser and a ``trainer.info``
+                     summary to; emptied first
+        """
+        if log_dir is not None:
+            self._prepare_output_dir(log_dir)
+        if model_dir is not None:
+            self._prepare_output_dir(model_dir)
+
+        parser = ConstituencyParser.create(
+            self.bert_path,
+            self.features,
+            bert_tokenizer=self.bert_tokenizer
+        )
+
+        parser.model.config.tf_legacy_loss = True
+        hf_loss = parser.model.hf_compute_loss
+
+        def _loss(labels, logits):
+            print('LABELS:', labels)
+            print('LOGITS:', logits)
+            l = hf_loss(labels, logits)
+            print('LOSS:', l)
+            return l
+
+        # wrap in eager execution so that tensor values can be printed
+        def debug_loss(y_true, y_pred):
+            return tf.py_function(func=_loss, inp=[tf.cast(y_true, tf.float32), y_pred], Tout=tf.float32)
+
+        # switch to debug_loss to print labels, logits and loss values
+        loss = hf_loss
+        #loss = debug_loss
+
+        # a factory: every output needs a metric object of its own
+        accuracy_metric = lambda: tf.keras.metrics.MeanMetricWrapper(
+            fn=_masked_sparse_categorical_accuracy, name='acc'
+        )
+
+        metrics = {cat : [accuracy_metric()] for cat in self.categories}
+
+        losses = {cat : loss for cat in self.categories}
+
+        initial_epoch = 0
+
+        parser.model.compile(
+            optimizer=tf.keras.optimizers.Adam(learning_rate=lr),
+            loss=losses,
+            metrics=metrics
+        )
+        parser.model.fit(
+            x=self.train_data,
+            validation_data=self.dev_data,
+            epochs=epochs,
+            callbacks=self._make_callbacks(log_dir),
+            initial_epoch=initial_epoch,
+        )
+
+        if model_dir is not None:
+            parser.save(model_dir)
+            with open(f'{model_dir}/trainer.info', 'w') as f:
+                print(f'dataset: {self.dataset}', file=f)
+                print(f'batch_size: {self.batch_size}', file=f)
+                print(f'epochs: {epochs}', file=f)
+                print(f'lr: {lr}', file=f)
+
+        return parser