TrainModel.ipynb 2.56 MB
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 
528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 
1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350 1351 1352 1353 1354 1355 1356 1357 1358 1359 1360 1361 1362 1363 1364 1365 1366 1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 
1422 1423 1424 1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 1525 1526 1527 1528 1529 1530 1531 1532 1533 1534 1535 1536 1537 1538 1539 1540 1541 1542 1543 1544 1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555 1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578 1579 1580 1581 1582 1583 1584 1585 1586 1587 1588 1589 1590 1591 1592 1593 1594 1595 1596 1597 1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620 1621 1622 1623 1624 1625 1626 1627 1628 1629 1630 1631 1632 1633 1634 1635 1636 1637 1638 1639 1640 1641 1642 1643 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654 1655 1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735 1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758 1759 1760 1761 1762 1763 1764 1765 1766 1767 1768 1769 1770 1771 1772 1773 1774 1775 1776 1777 1778 1779 1780 1781 1782 1783 1784 1785 1786 1787 1788 1789 1790 1791 1792 1793 1794 1795 1796 1797 1798 1799 1800 1801 1802 1803 1804 1805 1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820 1821 
1822 1823 1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844 1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867 1868 1869 1870 1871 1872 1873 1874 1875 1876 1877 1878 1879 1880 1881 1882 1883 1884 1885 1886 1887 1888 1889 1890 1891 1892 1893 1894 1895 1896 1897 1898 1899 1900 1901 1902 1903 1904 1905 1906 1907 1908 1909 1910 1911 1912 1913 1914 1915 1916 1917 1918 1919 1920 1921 1922 1923 1924 1925 1926 1927 1928 1929 1930 1931 1932 1933 1934 1935 1936 1937 1938 1939 1940 1941 1942 1943 1944 1945 1946 1947 1948 1949 1950 1951 1952 1953 1954 1955 1956 1957 1958 1959 1960 1961 1962 1963 1964 1965 1966 1967 1968 1969 1970 1971 1972 1973 1974 1975 1976 1977 1978 1979 1980 1981 1982 1983 1984 1985 1986 1987 1988 1989 1990 1991 1992 1993 1994 1995 1996 1997 1998 1999 2000 2001 2002 2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017 2018 2019 2020 2021 2022 2023 2024 2025 2026 2027 2028 2029 2030 2031 2032 2033 2034 2035 2036 2037 2038 2039 2040 2041 2042 2043 2044 2045 2046 2047 2048 2049 2050 2051 2052 2053 2054 2055 2056 2057 2058 2059 2060 2061 2062 2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073 2074 2075 2076 2077 2078 2079 2080 2081 2082 2083 2084 2085 2086 2087 2088 2089 2090 2091 2092 2093 2094 2095 2096 2097 2098 2099 2100 2101 2102 2103 2104 2105 2106 2107 2108 2109 2110 2111 2112 2113 2114 2115 2116 2117 2118 2119 2120 2121 2122 2123 2124 2125 2126 2127 2128 2129 2130 2131 2132 2133 2134 2135 2136 2137 2138 2139 2140 2141 2142 2143 2144 2145 2146 2147 2148 2149 2150 2151 2152 2153 2154 2155 2156 2157 2158 2159 2160 2161 2162 2163 2164 2165 2166 2167 2168 2169 2170 2171 2172 2173 2174 2175 2176 2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189 2190 2191 2192 2193 2194 2195 2196 2197 2198 2199 2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 
2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281 2282 2283 2284 2285 2286 2287 2288 2289 2290 2291 2292 2293 2294 2295 2296 2297 2298 2299 2300 2301 2302 2303 2304 2305 2306 2307 2308 2309 2310 2311 2312 2313 2314 2315 2316 2317 2318 2319 2320 2321 2322 2323 2324 2325 2326 2327 2328 2329 2330 2331 2332 2333 2334 2335 2336 2337 2338 2339 2340 2341 2342 2343 2344 2345 2346 2347 2348 2349 2350 2351 2352 2353 2354 2355 2356 2357 2358 2359 2360 2361 2362 2363 2364 2365 2366 2367 2368 2369 2370 2371 2372 2373 2374 2375 2376 2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 2399 2400 2401 2402 2403 2404 2405 2406 2407 2408 2409 2410 2411 2412 2413 2414 2415 2416 2417 2418 2419 2420 2421 2422 2423 2424 2425 2426 2427 2428 2429 2430 2431 2432 2433 2434 2435 2436 2437 2438 2439 2440 2441 2442 2443 2444 2445 2446 2447 2448 2449 2450 2451 2452 2453 2454 2455 2456 2457 2458 2459 2460 2461 2462 2463 2464 2465 2466 2467 2468 2469 2470 2471 2472 2473 2474 2475 2476 2477 2478 2479 2480 2481 2482 2483 2484 2485 2486 2487 2488 2489 2490 2491 2492 2493 2494 2495 2496 2497 2498 2499 2500 2501 2502 2503 2504 2505 2506 2507 2508 2509 2510 2511 2512 2513 2514 2515 2516 2517 2518 2519 2520 2521 2522 2523 2524 2525 2526 2527 2528 2529 2530 2531 2532 2533 2534 2535 2536 2537 2538 2539 2540 2541 2542 2543 2544 2545 2546 2547 2548 2549 2550 2551 2552 2553 2554 2555 2556 2557 2558 2559 2560 2561 2562 2563 2564 2565 2566 2567 2568 2569 2570 2571 2572 2573 2574 2575 2576 2577 2578 2579 2580 2581 2582 2583 2584 2585 2586 2587 2588 2589 2590 2591 2592 2593 2594 2595 2596 2597 2598 2599 2600 2601 2602 2603 2604 2605 2606 2607 2608 2609 2610 2611 2612 2613 2614 2615 2616 2617 2618 2619 2620 2621 
2622 2623 2624 2625 2626 2627 2628 2629 2630 2631 2632 2633 2634 2635 2636 2637 2638 2639 2640 2641 2642 2643 2644 2645 2646 2647 2648 2649 2650 2651 2652 2653 2654 2655 2656 2657 2658 2659 2660 2661 2662 2663 2664 2665 2666 2667 2668 2669 2670 2671 2672 2673 2674 2675 2676 2677 2678 2679 2680 2681 2682 2683 2684 2685 2686 2687 2688 2689 2690 2691 2692 2693 2694 2695 2696 2697 2698 2699 2700 2701 2702 2703 2704 2705 2706 2707 2708 2709 2710 2711 2712 2713 2714 2715 2716 2717 2718 2719 2720 2721 2722 2723 2724 2725 2726 2727 2728 2729 2730 2731 2732 2733 2734 2735 2736 2737 2738 2739 2740 2741 2742 2743 2744 2745 2746 2747 2748 2749 2750 2751 2752 2753 2754 2755 2756 2757 2758 2759 2760 2761 2762 2763 2764 2765 2766 2767 2768 2769 2770 2771 2772 2773 2774 2775 2776 2777 2778 2779 2780 2781 2782 2783 2784 2785 2786 2787 2788 2789 2790 2791 2792 2793 2794 2795 2796 2797 2798 2799 2800 2801 2802 2803 2804 2805 2806 2807 2808 2809 2810 2811 2812 2813 2814 2815 2816 2817 2818 2819 2820 2821 2822 2823 2824 2825 2826 2827 2828 2829 2830 2831 2832 2833 2834 2835 2836 2837 2838 2839 2840 2841 2842 2843 2844 2845 2846 2847 2848 2849 2850 2851 2852 2853 2854 2855 2856 2857 2858 2859 2860 2861 2862 2863 2864 2865 2866 2867 2868 2869 2870 2871 2872 2873 2874 2875 2876 2877 2878 2879 2880 2881 2882 2883 2884 2885 2886 2887 2888 2889 2890 2891 2892 2893 2894 2895 2896 2897 2898 2899 2900 2901 2902 2903 2904 2905 2906 2907 2908 2909 2910 2911 2912 2913 2914 2915 2916 2917 2918 2919 2920 2921 2922 2923 2924 2925 2926 2927 2928 2929 2930 2931 2932 2933 2934 2935 2936 2937 2938 2939 2940 2941 2942 2943 2944 2945 2946 2947 2948 2949 2950 2951 2952 2953 2954 2955 2956 2957 2958 2959 2960 2961 2962 2963 2964 2965 2966 2967 2968 2969 2970 2971 2972 2973 2974 2975 2976 2977 2978 2979 2980 2981 2982 2983 2984 2985 2986 2987 2988 2989 2990 2991 2992 2993 2994 2995 2996 2997 2998 2999 3000 3001 3002 3003 3004 3005 3006 3007 3008 3009 3010 3011 3012 3013 3014 3015 3016 3017 3018 3019 3020 3021 
3022 3023 3024 3025 3026 3027 3028 3029 3030 3031 3032 3033 3034 3035 3036 3037 3038 3039 3040 3041 3042 3043 3044 3045 3046 3047 3048 3049 3050 3051 3052 3053 3054 3055 3056 3057 3058 3059 3060 3061 3062 3063 3064 3065 3066 3067 3068 3069 3070 3071 3072 3073 3074 3075 3076 3077 3078 3079 3080 3081 3082 3083 3084 3085 3086 3087 3088 3089 3090 3091 3092 3093 3094 3095 3096 3097 3098 3099 3100 3101 3102 3103 3104 3105 3106 3107 3108 3109 3110 3111 3112 3113 3114 3115 3116 3117 3118 3119 3120 3121 3122 3123 3124 3125 3126 3127 3128 3129 3130 3131 3132 3133 3134 3135 3136 3137 3138 3139 3140 3141 3142 3143 3144 3145 3146 3147 3148 3149 3150 3151 3152 3153 3154 3155 3156 3157 3158 3159 3160 3161 3162 3163 3164 3165 3166 3167 3168 3169 3170 3171 3172 3173 3174 3175 3176 3177 3178 3179 3180 3181 3182 3183 3184 3185 3186 3187 3188 3189 3190 3191 3192 3193 3194 3195 3196 3197 3198 3199 3200 3201 3202 3203 3204 3205 3206 3207 3208 3209 3210 3211 3212 3213 3214 3215 3216 3217 3218 3219 3220 3221 3222 3223 3224 3225 3226 3227 3228 3229 3230 3231 3232 3233 3234 3235 3236 3237 3238 3239 3240 3241 3242 3243 3244 3245 3246 3247 3248 3249 3250 3251 3252 3253 3254 3255 3256 3257 3258 3259 3260 3261 3262 3263 3264 3265 3266 3267 3268 3269 3270 3271 3272 3273 3274 3275 3276 3277 3278 3279 3280 3281 3282 3283 3284 3285 3286 3287 3288 3289 3290 3291 3292 3293 3294 3295 3296 3297 3298 3299 3300 3301 3302 3303 3304 3305 3306 3307 3308 3309 3310 3311 3312 3313 3314 3315 3316 3317 3318 3319 3320 3321 3322 3323 3324 3325 3326 3327 3328 3329 3330 3331 3332 3333 3334 3335 3336 3337 3338 3339 3340 3341 3342 3343 3344 3345 3346 3347 3348 3349 3350 3351 3352 3353 3354 3355 3356 3357 3358 3359 3360 3361 3362 3363 3364 3365 3366 3367 3368 3369 3370 3371 3372 3373 3374 3375 3376 3377 3378 3379 3380 3381 3382 3383 3384 3385 3386 3387 3388 3389 3390 3391 3392 3393 3394 3395 3396 3397 3398 3399 3400 3401 3402 3403 3404 3405 3406 3407 3408 3409 3410 3411 3412 3413 3414 3415 3416 3417 3418 3419 3420 3421 
3422 3423 3424 3425 3426 3427 3428 3429 3430 3431 3432 3433 3434 3435 3436 3437 3438 3439 3440 3441 3442 3443 3444 3445 3446 3447 3448 3449 3450 3451 3452 3453 3454 3455 3456 3457 3458 3459 3460 3461 3462 3463 3464 3465 3466 3467 3468 3469 3470 3471 3472 3473 3474 3475 3476 3477 3478 3479 3480 3481 3482 3483 3484 3485 3486 3487 3488 3489 3490 3491 3492 3493 3494 3495 3496 3497 3498 3499 3500 3501 3502 3503 3504 3505 3506 3507 3508 3509 3510 3511 3512 3513 3514 3515 3516 3517 3518 3519 3520 3521 3522 3523 3524 3525 3526 3527 3528 3529 3530 3531 3532 3533 3534 3535 3536 3537 3538 3539 3540 3541 3542 3543 3544 3545 3546 3547 3548 3549 3550 3551 3552 3553 3554 3555 3556 3557 3558 3559 3560 3561 3562 3563 3564 3565 3566 3567 3568 3569 3570 3571 3572 3573 3574 3575 3576 3577 3578 3579 3580 3581 3582 3583 3584 3585 3586 3587 3588 3589 3590 3591 3592 3593 3594 3595 3596 3597 3598 3599 3600 3601 3602 3603 3604 3605 3606 3607 3608 3609 3610 3611 3612 3613 3614 3615 3616 3617 3618 3619 3620 3621 3622 3623 3624 3625 3626 3627 3628 3629 3630 3631 3632 3633 3634 3635 3636 3637 3638 3639 3640 3641 3642 3643 3644 3645 3646 3647 3648 3649 3650 3651 3652 3653 3654 3655 3656 3657 3658 3659 3660 3661 3662 3663 3664 3665 3666 3667 3668 3669 3670 3671 3672 3673 3674 3675 3676 3677 3678 3679 3680 3681 3682 3683 3684 3685 3686 3687 3688 3689 3690 3691 3692 3693 3694 3695 3696 3697 3698 3699 3700 3701 3702 3703 3704 3705 3706 3707 3708 3709 3710 3711 3712 3713 3714 3715 3716 3717 3718 3719 3720 3721 3722 3723 3724 3725 3726 3727 3728 3729 3730 3731 3732 3733 3734 3735 3736 3737 3738 3739 3740 3741 3742 3743 3744 3745 3746 3747 3748 3749 3750 3751 3752 3753 3754 3755 3756 3757 3758 3759 3760 3761 3762 3763 3764 3765 3766 3767 3768 3769 3770 3771 3772 3773 3774 3775 3776 3777 3778 3779 3780 3781 3782 3783 3784 3785 3786 3787 3788 3789 3790 3791 3792 3793 3794 3795 3796 3797 3798 3799 3800 3801 3802 3803 3804 3805 3806 3807 3808 3809 3810 3811 3812 3813 3814 3815 3816 3817 3818 3819 3820 3821 
3822 3823 3824 3825 3826 3827 3828 3829 3830 3831 3832 3833 3834 3835 3836 3837 3838 3839 3840 3841 3842 3843 3844 3845 3846 3847 3848 3849 3850 3851 3852 3853 3854 3855 3856 3857 3858 3859 3860 3861 3862 3863 3864 3865 3866 3867 3868 3869 3870 3871 3872 3873 3874 3875 3876 3877 3878 3879 3880 3881 3882 3883 3884 3885 3886 3887 3888 3889 3890 3891 3892 3893 3894 3895 3896 3897 3898 3899 3900 3901 3902 3903 3904 3905 3906 3907 3908 3909 3910 3911 3912 3913 3914 3915 3916 3917 3918 3919 3920 3921 3922 3923 3924 3925 3926 3927 3928 3929 3930 3931 3932 3933 3934 3935 3936 3937 3938 3939 3940 3941 3942 3943 3944 3945 3946 3947 3948 3949 3950 3951 3952 3953 3954 3955 3956 3957 3958 3959 3960 3961 3962 3963 3964 3965 3966 3967 3968 3969 3970 3971 3972 3973 3974 3975 3976 3977 3978 3979 3980 3981 3982 3983 3984 3985 3986 3987 3988 3989 3990 3991 3992 3993 3994 3995 3996 3997 3998 3999 4000 4001 4002 4003 4004 4005 4006 4007 4008 4009 4010 4011 4012 4013 4014 4015 4016 4017 4018 4019 4020 4021 4022 4023 4024 4025 4026 4027 4028 4029 4030 4031 4032 4033 4034 4035 4036 4037 4038 4039 4040 4041 4042 4043 4044 4045 4046 4047 4048 4049 4050 4051 4052 4053 4054 4055 4056 4057 4058 4059 4060 4061 4062 4063 4064 4065 4066 4067 4068 4069 4070 4071 4072 4073 4074 4075 4076 4077 4078 4079 4080 4081 4082 4083 4084 4085 4086 4087 4088 4089 4090 4091 4092 4093 4094 4095 4096 4097 4098 4099 4100 4101 4102 4103 4104 4105 4106 4107 4108 4109 4110 4111 4112 4113 4114 4115 4116 4117 4118 4119 4120 4121 4122 4123 4124 4125 4126 4127 4128 4129 4130 4131 4132 4133 4134 4135 4136 4137 4138 4139 4140 4141 4142 4143 4144 4145 4146 4147 4148 4149 4150 4151 4152 4153 4154 4155 4156 4157 4158 4159 4160 4161 4162 4163 4164 4165 4166 4167 4168 4169 4170 4171 4172 4173 4174 4175 4176 4177 4178 4179 4180 4181 4182 4183 4184 4185 4186 4187 4188 4189 4190 4191 4192 4193 4194 4195 4196 4197 4198 4199 4200 4201 4202 4203 4204 4205 4206 4207 4208 4209 4210 4211 4212 4213 4214 4215 4216 4217 4218 4219 4220 4221 
4222 4223 4224 4225 4226 4227 4228 4229 4230 4231 4232 4233 4234 4235 4236 4237 4238 4239 4240 4241 4242 4243 4244 4245 4246 4247 4248 4249 4250 4251 4252 4253 4254 4255 4256 4257 4258 4259 4260 4261 4262 4263 4264 4265 4266 4267 4268 4269 4270 4271 4272 4273 4274 4275 4276 4277 4278 4279 4280 4281 4282 4283 4284 4285 4286 4287 4288 4289 4290 4291 4292 4293 4294 4295 4296 4297 4298 4299 4300 4301 4302 4303 4304 4305 4306 4307 4308 4309 4310 4311 4312 4313 4314 4315 4316 4317 4318 4319 4320 4321 4322 4323 4324 4325 4326 4327 4328 4329 4330 4331 4332 4333 4334 4335 4336 4337 4338 4339 4340 4341 4342 4343 4344 4345 4346 4347 4348 4349 4350 4351 4352 4353 4354 4355 4356 4357 4358 4359 4360 4361 4362 4363 4364 4365 4366 4367 4368 4369 4370 4371 4372 4373 4374 4375 4376 4377 4378 4379 4380 4381 4382 4383 4384 4385 4386 4387 4388 4389 4390 4391 4392 4393 4394 4395 4396 4397 4398 4399 4400 4401 4402 4403 4404 4405 4406 4407 4408 4409 4410 4411 4412 4413 4414 4415 4416 4417 4418 4419 4420 4421 4422 4423 4424 4425 4426 4427 4428 4429 4430 4431 4432 4433 4434 4435 4436 4437 4438 4439 4440 4441 4442 4443 4444 4445 4446 4447 4448 4449 4450 4451 4452 4453 4454 4455 4456 4457 4458 4459 4460 4461 4462 4463 4464 4465 4466 4467 4468 4469 4470 4471 4472 4473 4474 4475 4476 4477 4478 4479 4480 4481 4482 4483 4484 4485 4486 4487 4488 4489 4490 4491 4492 4493 4494 4495 4496 4497 4498 4499 4500 4501 4502 4503 4504 4505 4506 4507 4508 4509 4510 4511 4512 4513 4514 4515 4516 4517 4518 4519 4520 4521 4522 4523 4524 4525 4526 4527 4528 4529 4530 4531 4532 4533 4534 4535 4536 4537 4538 4539 4540 4541 4542 4543 4544 4545 4546 4547 4548 4549 4550 4551 4552 4553 4554 4555 4556 4557 4558 4559 4560 4561 4562 4563 4564 4565 4566 4567 4568 4569 4570 4571 4572 4573 4574 4575 4576 4577 4578 4579 4580 4581 4582 4583 4584 4585 4586 4587 4588 4589 4590 4591 4592 4593 4594 4595 4596 4597 4598 4599 4600 4601 4602 4603 4604 4605 4606 4607 4608 4609 4610 4611 4612 4613 4614 4615 4616 4617 4618 4619 4620 4621 
4622 4623 4624 4625 4626 4627 4628 4629 4630 4631 4632 4633 4634 4635 4636 4637 4638 4639 4640 4641 4642 4643 4644 4645 4646 4647 4648 4649 4650 4651 4652 4653 4654 4655 4656 4657 4658 4659 4660 4661 4662 4663 4664 4665 4666 4667 4668 4669 4670 4671 4672 4673 4674 4675 4676 4677 4678 4679 4680 4681 4682 4683 4684 4685 4686 4687 4688 4689 4690 4691 4692 4693 4694 4695 4696 4697 4698 4699 4700 4701 4702 4703 4704 4705 4706 4707 4708 4709 4710 4711 4712 4713 4714 4715 4716 4717 4718 4719 4720 4721 4722 4723 4724 4725 4726 4727 4728 4729 4730 4731 4732 4733 4734 4735 4736 4737 4738 4739 4740 4741 4742 4743 4744 4745 4746 4747 4748 4749 4750 4751 4752 4753 4754 4755 4756 4757 4758 4759 4760 4761 4762 4763 4764 4765 4766 4767 4768 4769 4770 4771 4772 4773 4774 4775 4776 4777 4778 4779 4780 4781 4782 4783 4784 4785 4786 4787 4788 4789 4790 4791 4792 4793 4794 4795 4796 4797 4798 4799 4800 4801 4802 4803 4804 4805 4806 4807 4808 4809 4810 4811 4812 4813 4814 4815 4816 4817 4818 4819 4820 4821 4822 4823 4824 4825 4826 4827 4828 4829 4830 4831 4832 4833 4834 4835 4836 4837 4838 4839 4840 4841 4842 4843 4844 4845 4846 4847 4848 4849 4850 4851 4852 4853 4854 4855 4856 4857 4858 4859 4860 4861 4862 4863 4864 4865 4866 4867 4868 4869 4870 4871 4872 4873 4874 4875 4876 4877 4878 4879 4880 4881 4882 4883 4884 4885 4886 4887 4888 4889 4890 4891 4892 4893 4894 4895 4896 4897 4898 4899 4900 4901 4902 4903 4904 4905 4906 4907 4908 4909 4910 4911 4912 4913 4914 4915 4916 4917 4918 4919 4920 4921 4922 4923 4924 4925 4926 4927 4928 4929 4930 4931 4932 4933 4934 4935 4936 4937 4938 4939 4940 4941 4942 4943 4944 4945 4946 4947 4948 4949 4950 4951 4952 4953 4954 4955 4956 4957 4958 4959 4960 4961 4962 4963 4964 4965 4966 4967 4968 4969 4970 4971 4972 4973 4974 4975 4976 4977 4978 4979 4980 4981 4982 4983 4984 4985 4986 4987 4988 4989 4990 4991 4992 4993 4994 4995 4996 4997 4998 4999 5000 5001 5002 5003 5004 5005 5006 5007 5008 5009 5010 5011 5012 5013 5014 5015 5016 5017 5018 5019 5020 5021 
5022 5023 5024 5025 5026 5027 5028 5029 5030 5031 5032 5033 5034 5035 5036 5037 5038 5039 5040 5041 5042 5043 5044 5045 5046 5047 5048 5049 5050 5051 5052 5053 5054 5055 5056 5057 5058 5059 5060 5061 5062 5063 5064 5065 5066 5067 5068 5069 5070 5071 5072 5073 5074 5075 5076 5077 5078 5079 5080 5081 5082 5083 5084 5085 5086 5087 5088 5089 5090 5091 5092 5093 5094 5095 5096 5097 5098 5099 5100 5101 5102 5103 5104 5105 5106 5107 5108 5109 5110 5111 5112 5113 5114 5115 5116 5117 5118 5119 5120 5121 5122 5123 5124 5125 5126 5127 5128 5129 5130 5131 5132 5133 5134 5135 5136 5137 5138 5139 5140 5141 5142 5143 5144 5145 5146 5147 5148 5149 5150 5151 5152 5153 5154 5155 5156 5157 5158 5159 5160 5161 5162 5163 5164 5165 5166 5167 5168 5169 5170 5171 5172 5173 5174 5175 5176 5177 5178 5179 5180 5181 5182 5183 5184 5185 5186 5187 5188 5189 5190 5191 5192 5193 5194 5195 5196 5197 5198 5199 5200 5201 5202 5203 5204 5205 5206 5207 5208 5209 5210 5211 5212 5213 5214 5215 5216 5217 5218 5219 5220 5221 5222 5223 5224 5225 5226 5227 5228 5229 5230 5231 5232 5233 5234 5235 5236 5237 5238 5239 5240 5241 5242 5243 5244 5245 5246 5247 5248 5249 5250 5251 5252 5253 5254 5255 5256 5257 5258 5259 5260 5261 5262 5263 5264 5265 5266 5267 5268 5269 5270 5271 5272 5273 5274 5275 5276 5277 5278 5279 5280 5281 5282 5283 5284 5285 5286 5287 5288 5289 5290 5291 5292 5293 5294 5295 5296 5297 5298 5299 5300 5301 5302 5303 5304 5305 5306 5307 5308 5309 5310 5311 5312 5313 5314 5315 5316 5317 5318 5319 5320 5321 5322 5323 5324 5325 5326 5327 5328 5329 5330 5331 5332 5333 5334 5335 5336 5337 5338 5339 5340 5341 5342 5343 5344 5345 5346 5347 5348 5349 5350 5351 5352 5353 5354 5355 5356 5357 5358 5359 5360 5361 5362 5363 5364 5365 5366 5367 5368 5369 5370 5371 5372 5373 5374 5375 5376 5377 5378 5379 5380 5381 5382 5383 5384 5385 5386 5387 5388 5389 5390 5391 5392 5393 5394 5395 5396 5397 5398 5399 5400 5401 5402 5403 5404 5405 5406 5407 5408 5409 5410 5411 5412 5413 5414 5415 5416 5417 5418 5419 5420 5421 
5422 5423 5424 5425 5426 5427 5428 5429 5430 5431 5432 5433 5434 5435 5436 5437 5438 5439 5440 5441 5442 5443 5444 5445 5446 5447 5448 5449 5450 5451 5452 5453 5454 5455 5456 5457 5458 5459 5460 5461 5462 5463 5464 5465 5466 5467 5468 5469 5470 5471 5472 5473 5474 5475 5476 5477 5478 5479 5480 5481 5482 5483 5484 5485 5486 5487 5488 5489 5490 5491 5492 5493 5494 5495 5496 5497 5498 5499 5500 5501 5502 5503 5504 5505 5506 5507 5508 5509 5510 5511 5512 5513 5514 5515 5516 5517 5518 5519 5520 5521 5522 5523 5524 5525 5526 5527 5528 5529 5530 5531 5532 5533 5534 5535 5536 5537 5538 5539 5540 5541 5542 5543 5544 5545 5546 5547 5548 5549 5550 5551 5552 5553 5554 5555 5556 5557 5558 5559 5560 5561 5562 5563 5564 5565 5566 5567 5568 5569 5570 5571 5572 5573 5574 5575 5576 5577 5578 5579 5580 5581 5582 5583 5584 5585 5586 5587 5588 5589 5590 5591 5592 5593 5594 5595 5596 5597 5598 5599 5600 5601 5602 5603 5604 5605 5606 5607 5608 5609 5610 5611 5612 5613 5614 5615 5616 5617 5618 5619 5620 5621 5622 5623 5624 5625 5626 5627 5628 5629 5630 5631 5632 5633 5634 5635 5636 5637 5638 5639 5640 5641 5642 5643 5644 5645 5646 5647 5648 5649 5650 5651 5652 5653 5654 5655 5656 5657 5658 5659 5660 5661 5662 5663 5664 5665 5666 5667 5668 5669 5670 5671 5672 5673 5674 5675 5676 5677 5678 5679 5680 5681 5682 5683 5684 5685 5686 5687 5688 5689 5690 5691 5692 5693 5694 5695 5696 5697 5698 5699 5700 5701 5702 5703 5704 5705 5706 5707 5708 5709 5710 5711 5712 5713 5714 5715 5716 5717 5718 5719 5720 5721 5722 5723 5724 5725 5726 5727 5728 5729 5730 5731 5732 5733 5734 5735 5736 5737 5738 5739 5740 5741 5742 5743 5744 5745 5746 5747 5748 5749 5750 5751 5752 5753 5754 5755 5756 5757 5758 5759 5760 5761 5762 5763 5764 5765 5766 5767 5768 5769 5770 5771 5772 5773 5774 5775 5776 5777 5778 5779 5780 5781 5782 5783 5784 5785 5786 5787 5788 5789 5790 5791 5792 5793 5794 5795 5796 5797 5798 5799 5800 5801 5802 5803 5804 5805 5806 5807 5808 5809 5810 5811 5812 5813 5814 5815 5816 5817 5818 5819 5820 5821 
5822 5823 5824 5825 5826 5827 5828 5829 5830 5831 5832 5833 5834 5835 5836 5837 5838 5839 5840 5841 5842 5843 5844 5845 5846 5847 5848 5849 5850 5851 5852 5853 5854 5855 5856 5857 5858 5859 5860 5861 5862 5863 5864 5865 5866 5867 5868 5869 5870 5871 5872 5873 5874 5875 5876 5877 5878 5879 5880 5881 5882 5883 5884 5885 5886 5887 5888 5889 5890 5891 5892 5893 5894 5895 5896 5897 5898 5899 5900 5901 5902 5903 5904 5905 5906 5907 5908 5909 5910 5911 5912 5913 5914 5915 5916 5917 5918 5919 5920 5921 5922 5923 5924 5925 5926 5927 5928 5929 5930 5931 5932 5933 5934 5935 5936 5937 5938 5939 5940 5941 5942 5943 5944 5945 5946 5947 5948 5949 5950 5951 5952 5953 5954 5955 5956 5957 5958 5959 5960 5961 5962 5963 5964 5965 5966 5967 5968 5969 5970 5971 5972 5973 5974 5975 5976 5977 5978 5979 5980 5981 5982 5983 5984 5985 5986 5987 5988 5989 5990 5991 5992 5993 5994 5995 5996 5997 5998 5999 6000 6001 6002 6003 6004 6005 6006 6007 6008 6009 6010 6011 6012 6013 6014 6015 6016 6017 6018 6019 6020 6021 6022 6023 6024 6025 6026 6027 6028 6029 6030 6031 6032 6033 6034 6035 6036 6037 6038 6039 6040 6041 6042 6043 6044 6045 6046 6047 6048 6049 6050 6051 6052 6053 6054 6055 6056 6057 6058 6059 6060 6061 6062 6063 6064 6065 6066 6067 6068 6069 6070 6071 6072 6073 6074 6075 6076 6077 6078 6079 6080 6081 6082 6083 6084 6085 6086 6087 6088 6089 6090 6091 6092 6093 6094 6095 6096 6097 6098 6099 6100 6101 6102 6103 6104 6105 6106 6107 6108 6109 6110 6111 6112 6113 6114 6115 6116 6117 6118 6119 6120 6121 6122 6123 6124 6125 6126 6127 6128 6129 6130 6131 6132 6133 6134 6135 6136 6137 6138 6139 6140 6141 6142 6143 6144 6145 6146 6147 6148 6149 6150 6151 6152 6153 6154 6155 6156 6157 6158 6159 6160 6161 6162 6163 6164 6165 6166 6167 6168 6169 6170 6171 6172 6173 6174 6175 6176 6177 6178 6179 6180 6181 6182 6183 6184 6185 6186 6187 6188 6189 6190 6191 6192 6193 6194 6195 6196 6197 6198 6199 6200 6201 6202 6203 6204 6205 6206 6207 6208 6209 6210 6211 6212 6213 6214 6215 6216 6217 6218 6219 6220 6221 
6222 6223 6224 6225 6226 6227 6228 6229 6230 6231 6232 6233 6234 6235 6236 6237 6238 6239 6240 6241 6242 6243 6244 6245 6246 6247 6248 6249 6250 6251 6252 6253 6254 6255 6256 6257 6258 6259 6260 6261 6262 6263 6264 6265 6266 6267 6268 6269 6270 6271 6272 6273 6274 6275 6276 6277 6278 6279 6280 6281 6282 6283 6284 6285 6286 6287 6288 6289 6290 6291 6292 6293 6294 6295 6296 6297 6298 6299 6300 6301 6302 6303 6304 6305 6306 6307 6308 6309 6310 6311 6312 6313 6314 6315 6316 6317 6318 6319 6320 6321 6322 6323 6324 6325 6326 6327 6328 6329 6330 6331 6332 6333 6334 6335 6336 6337 6338 6339 6340 6341 6342 6343 6344 6345 6346 6347 6348 6349 6350 6351 6352 6353 6354 6355 6356 6357 6358 6359 6360 6361 6362 6363 6364 6365 6366 6367 6368 6369 6370 6371 6372 6373 6374 6375 6376 6377 6378 6379 6380 6381 6382 6383 6384 6385 6386 6387 6388 6389 6390 6391 6392 6393 6394 6395 6396 6397 6398 6399 6400 6401 6402 6403 6404 6405 6406 6407 6408 6409 6410 6411 6412 6413 6414 6415 6416 6417 6418 6419 6420 6421 6422 6423 6424 6425 6426 6427 6428 6429 6430 6431 6432 6433 6434 6435 6436 6437 6438 6439 6440 6441 6442 6443 6444 6445 6446 6447 6448 6449 6450 6451 6452 6453 6454 6455 6456 6457 6458 6459 6460 6461 6462 6463 6464 6465 6466 6467 6468 6469 6470 6471 6472 6473 6474 6475 6476 6477 6478 6479 6480 6481 6482 6483 6484 6485 6486 6487 6488 6489 6490 6491 6492 6493 6494 6495 6496 6497 6498 6499 6500 6501 6502 6503 6504 6505 6506 6507 6508 6509 6510 6511 6512 6513 6514 6515 6516 6517 6518 6519 6520 6521 6522 6523 6524 6525 6526 6527 6528 6529 6530 6531 6532 6533 6534 6535 6536 6537 6538 6539 6540 6541 6542 6543 6544 6545 6546 6547 6548 6549 6550 6551 6552 6553 6554 6555 6556 6557 6558 6559 6560 6561 6562 6563 6564 6565 6566 6567 6568 6569 6570 6571 6572 6573 6574 6575 6576 6577 6578 6579 6580 6581 6582 6583 6584 6585 6586 6587 6588 6589 6590 6591 6592 6593 6594 6595 6596 6597 6598 6599 6600 6601 6602 6603 6604 6605 6606 6607 6608 6609 6610 6611 6612 6613 6614 6615 6616 6617 6618 6619 6620 6621 
6622 6623 6624 6625 6626 6627 6628 6629 6630 6631 6632 6633 6634 6635 6636 6637 6638 6639 6640 6641 6642 6643 6644 6645 6646 6647 6648 6649 6650 6651 6652 6653 6654 6655 6656 6657 6658 6659 6660 6661 6662 6663 6664 6665 6666 6667 6668 6669 6670 6671 6672 6673 6674 6675 6676 6677 6678 6679 6680 6681 6682 6683 6684 6685 6686 6687 6688 6689 6690 6691 6692 6693 6694 6695 6696 6697 6698 6699 6700 6701 6702 6703 6704 6705 6706 6707 6708 6709 6710 6711 6712 6713 6714 6715 6716 6717 6718 6719 6720 6721 6722 6723 6724 6725 6726 6727 6728 6729 6730 6731 6732 6733 6734 6735 6736 6737 6738 6739 6740 6741 6742 6743 6744 6745 6746 6747 6748 6749 6750 6751 6752 6753 6754 6755 6756 6757 6758 6759 6760 6761 6762 6763 6764 6765 6766 6767 6768 6769 6770 6771 6772 6773 6774 6775 6776 6777 6778 6779 6780 6781 6782 6783 6784 6785 6786 6787 6788 6789 6790 6791 6792 6793 6794 6795 6796 6797 6798 6799 6800 6801 6802 6803 6804 6805 6806 6807 6808 6809 6810 6811 6812 6813 6814 6815 6816 6817 6818 6819 6820 6821 6822 6823 6824 6825 6826 6827 6828 6829 6830 6831 6832 6833 6834 6835 6836 6837 6838 6839 6840 6841 6842 6843 6844 6845 6846 6847 6848 6849 6850 6851 6852 6853 6854 6855 6856 6857 6858 6859 6860 6861 6862 6863 6864 6865 6866 6867 6868 6869 6870 6871 6872 6873 6874 6875 6876 6877 6878 6879 6880 6881 6882 6883 6884 6885 6886 6887 6888 6889 6890 6891 6892 6893 6894 6895 6896 6897 6898 6899 6900 6901 6902 6903 6904 6905 6906 6907 6908 6909 6910 6911 6912 6913 6914 6915 6916 6917 6918 6919 6920 6921 6922 6923 6924 6925 6926 6927 6928 6929 6930 6931 6932 6933 6934 6935 6936 6937 6938 6939 6940 6941 6942 6943 6944 6945 6946 6947 6948 6949 6950 6951 6952 6953 6954 6955 6956 6957 6958 6959 6960 6961 6962 6963 6964 6965 6966 6967 6968 6969 6970 6971 6972 6973 6974 6975 6976 6977 6978 6979 6980 6981 6982 6983 6984 6985 6986 6987 6988 6989 6990 6991 6992 6993 6994 6995 6996 6997 6998 6999 7000 7001 7002 7003 7004 7005 7006 7007 7008 7009 7010 7011 7012 7013 7014 7015 7016 7017 7018 7019 7020 7021 
7022 7023 7024 7025 7026 7027 7028 7029 7030 7031 7032 7033 7034 7035 7036 7037 7038 7039 7040 7041 7042 7043 7044 7045 7046 7047 7048 7049 7050 7051 7052 7053 7054 7055 7056 7057 7058 7059 7060 7061 7062 7063 7064 7065 7066 7067 7068 7069 7070 7071 7072 7073 7074 7075 7076 7077 7078 7079 7080 7081 7082 7083 7084 7085 7086 7087 7088 7089 7090 7091 7092 7093 7094 7095 7096 7097 7098 7099 7100 7101 7102 7103 7104 7105 7106 7107 7108 7109 7110 7111 7112 7113 7114 7115 7116 7117 7118 7119 7120 7121 7122 7123 7124 7125 7126 7127 7128 7129 7130 7131 7132 7133 7134 7135 7136 7137 7138 7139 7140 7141 7142 7143 7144 7145 7146 7147 7148 7149 7150 7151 7152 7153 7154 7155 7156 7157 7158 7159 7160 7161 7162 7163 7164 7165 7166 7167 7168 7169 7170 7171 7172 7173 7174 7175 7176 7177 7178 7179 7180 7181 7182 7183 7184 7185 7186 7187 7188 7189 7190 7191 7192 7193 7194 7195 7196 7197 7198 7199 7200 7201 7202 7203 7204 7205 7206 7207 7208 7209 7210 7211 7212 7213 7214 7215 7216 7217 7218 7219 7220 7221 7222 7223 7224 7225 7226 7227 7228 7229 7230 7231 7232 7233 7234 7235 7236 7237 7238 7239 7240 7241 7242 7243 7244 7245 7246 7247 7248 7249 7250 7251 7252 7253 7254 7255 7256 7257 7258 7259 7260 7261 7262 7263 7264 7265 7266 7267 7268 7269 7270 7271 7272 7273 7274 7275 7276 7277 7278 7279 7280 7281 7282 7283 7284 7285 7286 7287 7288 7289 7290 7291 7292 7293 7294 7295 7296 7297 7298 7299 7300 7301 7302 7303 7304 7305 7306 7307 7308 7309 7310 7311 7312 7313 7314 7315 7316 7317 7318 7319 7320 7321 7322 7323 7324 7325 7326 7327 7328 7329 7330 7331 7332 7333 7334 7335 7336 7337 7338 7339 7340 7341 7342 7343 7344 7345 7346 7347 7348 7349 7350 7351 7352 7353 7354 7355 7356 7357 7358 7359 7360 7361 7362 7363 7364 7365 7366 7367 7368 7369 7370 7371 7372 7373 7374 7375 7376 7377 7378 7379 7380 7381 7382 7383 7384 7385 7386 7387 7388 7389 7390 7391 7392 7393 7394 7395 7396 7397 7398 7399 7400 7401 7402 7403 7404 7405 7406 7407 7408 7409 7410 7411 7412 7413 7414 7415 7416 7417 7418 7419 7420 7421 
7422 7423 7424 7425 7426 7427 7428 7429 7430 7431 7432 7433 7434 7435 7436 7437 7438 7439 7440 7441 7442 7443 7444 7445 7446 7447 7448 7449 7450 7451 7452 7453 7454 7455 7456 7457 7458 7459 7460 7461 7462 7463 7464 7465 7466 7467 7468 7469 7470 7471 7472 7473 7474 7475 7476 7477 7478 7479 7480 7481 7482 7483 7484 7485 7486 7487 7488 7489 7490 7491 7492 7493 7494 7495 7496 7497 7498 7499 7500 7501 7502 7503 7504 7505 7506 7507 7508 7509 7510 7511 7512 7513 7514 7515 7516 7517 7518 7519 7520 7521 7522 7523 7524 7525 7526 7527 7528 7529 7530 7531 7532 7533 7534 7535 7536 7537 7538 7539 7540 7541 7542 7543 7544 7545 7546 7547 7548 7549 7550 7551 7552 7553 7554 7555 7556 7557 7558 7559 7560 7561 7562 7563 7564 7565 7566 7567 7568 7569 7570 7571 7572 7573 7574 7575 7576 7577 7578 7579 7580 7581 7582 7583 7584 7585 7586 7587 7588 7589 7590 7591 7592 7593 7594 7595 7596 7597 7598 7599 7600 7601 7602 7603 7604 7605 7606 7607 7608 7609 7610 7611 7612 7613 7614 7615 7616 7617 7618 7619 7620 7621 7622 7623 7624 7625 7626 7627 7628 7629 7630 7631 7632 7633 7634 7635 7636 7637 7638 7639 7640 7641 7642 7643 7644 7645 7646 7647 7648 7649 7650 7651 7652 7653 7654 7655 7656 7657 7658 7659 7660 7661 7662 7663 7664 7665 7666 7667 7668 7669 7670 7671 7672 7673 7674 7675 7676 7677 7678 7679 7680 7681 7682 7683 7684 7685 7686 7687 7688 7689 7690 7691 7692 7693 7694 7695 7696 7697 7698 7699 7700 7701 7702 7703 7704 7705 7706 7707 7708 7709 7710 7711 7712 7713 7714 7715 7716 7717 7718 7719 7720 7721 7722 7723 7724 7725 7726 7727 7728 7729 7730 7731 7732 7733 7734 7735 7736 7737 7738 7739 7740 7741 7742 7743 7744 7745 7746 7747 7748 7749 7750 7751 7752 7753 7754 7755 7756 7757 7758 7759 7760 7761 7762 7763 7764 7765 7766 7767 7768 7769 7770 7771 7772 7773 7774 7775 7776 7777 7778 7779 7780 7781 7782 7783 7784 7785 7786 7787 7788 7789 7790 7791 7792 7793 7794 7795 7796 7797 7798 7799 7800 7801 7802 7803 7804 7805 7806 7807 7808 7809 7810 7811 7812 7813 7814 7815 7816 7817 7818 7819 7820 7821 
7822 7823 7824 7825 7826 7827 7828 7829 7830 7831 7832 7833 7834 7835 7836 7837 7838 7839 7840 7841 7842 7843 7844 7845 7846 7847 7848 7849 7850 7851 7852 7853 7854 7855 7856 7857 7858 7859 7860 7861 7862 7863 7864 7865 7866 7867 7868 7869 7870 7871 7872 7873 7874 7875 7876 7877 7878 7879 7880 7881 7882 7883 7884 7885 7886 7887 7888 7889 7890 7891 7892 7893 7894 7895 7896 7897 7898 7899 7900 7901 7902 7903 7904 7905 7906 7907 7908 7909 7910 7911 7912 7913 7914 7915 7916 7917 7918 7919 7920 7921 7922 7923 7924 7925 7926 7927 7928 7929 7930 7931 7932 7933 7934 7935 7936 7937 7938 7939 7940 7941 7942 7943 7944 7945 7946 7947 7948 7949 7950 7951 7952 7953 7954 7955 7956 7957 7958 7959 7960 7961 7962 7963 7964 7965 7966 7967 7968 7969 7970 7971 7972 7973 7974 7975 7976 7977 7978 7979 7980 7981 7982 7983 7984 7985 7986 7987 7988 7989 7990 7991 7992 7993 7994 7995 7996 7997 7998 7999 8000 8001 8002 8003 8004 8005 8006 8007 8008 8009 8010 8011 8012 8013 8014 8015 8016 8017 8018 8019 8020 8021 8022 8023 8024 8025 8026 8027 8028 8029 8030 8031 8032 8033 8034 8035 8036 8037 8038 8039 8040 8041 8042 8043 8044 8045 8046 8047 8048 8049 8050 8051 8052 8053 8054 8055 8056 8057 8058 8059 8060 8061 8062 8063 8064 8065 8066 8067 8068 8069 8070 8071 8072 8073 8074 8075 8076 8077 8078 8079 8080 8081 8082 8083 8084 8085 8086 8087 8088 8089 8090 8091 8092 8093 8094 8095 8096 8097 8098 8099 8100 8101 8102 8103 8104 8105 8106 8107 8108 8109 8110 8111 8112 8113 8114 8115 8116 8117 8118 8119 8120 8121 8122 8123 8124 8125 8126 8127 8128 8129 8130 8131 8132 8133 8134 8135 8136 8137 8138 8139 8140 8141 8142 8143 8144 8145 8146 8147 8148 8149 8150 8151 8152 8153 8154 8155 8156 8157 8158 8159 8160 8161 8162 8163 8164 8165 8166 8167 8168 8169 8170 8171 8172 8173 8174 8175 8176 8177 8178 8179 8180 8181 8182 8183 8184 8185 8186 8187 8188 8189 8190 8191 8192 8193 8194 8195 8196 8197 8198 8199 8200 8201 8202 8203 8204 8205 8206 8207 8208 8209 8210 8211 8212 8213 8214 8215 8216 8217 8218 8219 8220 8221 
8222 8223 8224 8225 8226 8227 8228 8229 8230 8231 8232 8233 8234 8235 8236 8237 8238 8239 8240 8241 8242 8243 8244 8245 8246 8247 8248 8249 8250 8251 8252 8253 8254 8255 8256 8257 8258 8259 8260 8261 8262 8263 8264 8265 8266 8267 8268 8269 8270 8271 8272 8273 8274 8275 8276 8277 8278 8279 8280 8281 8282 8283 8284 8285 8286 8287 8288 8289 8290 8291 8292 8293 8294 8295 8296 8297 8298 8299 8300 8301 8302 8303 8304 8305 8306 8307 8308 8309 8310 8311 8312 8313 8314 8315 8316 8317 8318 8319 8320 8321 8322 8323 8324 8325 8326 8327 8328 8329 8330 8331 8332 8333 8334 8335 8336 8337 8338 8339 8340 8341 8342 8343 8344 8345 8346 8347 8348 8349 8350 8351 8352 8353 8354 8355 8356 8357 8358 8359 8360 8361 8362 8363 8364 8365 8366 8367 8368 8369 8370 8371 8372 8373 8374 8375 8376 8377 8378 8379 8380 8381 8382 8383 8384 8385 8386 8387 8388 8389 8390 8391 8392 8393 8394 8395 8396 8397 8398 8399 8400 8401 8402 8403 8404 8405 8406 8407 8408 8409 8410 8411 8412 8413 8414 8415 8416 8417 8418 8419 8420 8421 8422 8423 8424 8425 8426 8427 8428 8429 8430 8431 8432 8433 8434 8435 8436 8437 8438 8439 8440 8441 8442 8443 8444 8445 8446 8447 8448 8449 8450 8451 8452 8453 8454 8455 8456 8457 8458 8459 8460 8461 8462 8463 8464 8465 8466 8467 8468 8469 8470 8471 8472 8473 8474 8475 8476 8477 8478 8479 8480 8481 8482 8483 8484 8485 8486 8487 8488 8489 8490 8491 8492 8493 8494 8495 8496 8497 8498 8499 8500 8501 8502 8503 8504 8505 8506 8507 8508 8509 8510 8511 8512 8513 8514 8515 8516 8517 8518 8519 8520 8521 8522 8523 8524 8525 8526 8527 8528 8529 8530 8531 8532 8533 8534 8535 8536 8537 8538 8539 8540 8541 8542 8543 8544 8545 8546 8547 8548 8549 8550 8551 8552 8553 8554 8555 8556 8557 8558 8559 8560 8561 8562 8563 8564 8565 8566 8567 8568 8569 8570 8571 8572 8573 8574 8575 8576 8577 8578 8579 8580 8581 8582 8583 8584 8585 8586 8587 8588 8589 8590 8591 8592 8593 8594 8595 8596 8597 8598 8599 8600 8601 8602 8603 8604 8605 8606 8607 8608 8609 8610 8611 8612 8613 8614 8615 8616 8617 8618 8619 8620 8621 
8622 8623 8624 8625 8626 8627 8628 8629 8630 8631 8632 8633 8634 8635 8636 8637 8638 8639 8640 8641 8642 8643 8644 8645 8646 8647 8648 8649 8650 8651 8652 8653 8654 8655 8656 8657 8658 8659 8660 8661 8662 8663 8664 8665 8666 8667 8668 8669 8670 8671 8672 8673 8674 8675 8676 8677 8678 8679 8680 8681 8682 8683 8684 8685 8686 8687 8688 8689 8690 8691 8692 8693 8694 8695 8696 8697 8698 8699 8700 8701 8702 8703 8704 8705 8706 8707 8708 8709 8710 8711 8712 8713 8714 8715 8716 8717 8718 8719 8720 8721 8722 8723 8724 8725 8726 8727 8728 8729 8730 8731 8732 8733 8734 8735 8736 8737 8738 8739 8740 8741 8742 8743 8744 8745 8746 8747 8748 8749 8750 8751 8752 8753 8754 8755 8756 8757 8758 8759 8760 8761 8762 8763 8764 8765 8766 8767 8768 8769 8770 8771 8772 8773 8774 8775 8776 8777 8778 8779 8780 8781 8782 8783 8784 8785 8786 8787 8788 8789 8790 8791 8792 8793 8794 8795 8796 8797 8798 8799 8800 8801 8802 8803 8804 8805 8806 8807 8808 8809 8810 8811 8812 8813 8814 8815 8816 8817 8818 8819 8820 8821 8822 8823 8824 8825 8826 8827 8828 8829 8830 8831 8832 8833 8834 8835 8836 8837 8838 8839 8840 8841 8842 8843 8844 8845 8846 8847 8848 8849 8850 8851 8852 8853 8854 8855 8856 8857 8858 8859 8860 8861 8862 8863 8864 8865 8866 8867 8868 8869 8870 8871 8872 8873 8874 8875 8876 8877 8878 8879 8880 8881 8882 8883 8884 8885 8886 8887 8888 8889 8890 8891 8892 8893 8894 8895 8896 8897 8898 8899 8900 8901 8902 8903 8904 8905 8906 8907 8908 8909 8910 8911 8912 8913 8914 8915 8916 8917 8918 8919 8920 8921 8922 8923 8924 8925 8926 8927 8928 8929 8930 8931 8932 8933 8934 8935 8936 8937 8938 8939 8940 8941 8942 8943 8944 8945 8946 8947 8948 8949 8950 8951 8952 8953 8954 8955 8956 8957 8958 8959 8960 8961 8962 8963 8964 8965 8966 8967 8968 8969 8970 8971 8972 8973 8974 8975 8976 8977 8978 8979 8980 8981 8982 8983 8984 8985 8986 8987 8988 8989 8990 8991 8992 8993 8994 8995 8996 8997 8998 8999 9000 9001 9002 9003 9004 9005 9006 9007 9008 9009 9010 9011 9012 9013 9014 9015 9016 9017 9018 9019 9020 9021 
9022 9023 9024 9025 9026 9027 9028 9029 9030 9031 9032 9033 9034 9035 9036 9037 9038 9039 9040 9041 9042 9043 9044 9045 9046 9047 9048 9049 9050 9051 9052 9053 9054 9055 9056 9057 9058 9059 9060 9061 9062 9063 9064 9065 9066 9067 9068 9069 9070 9071 9072 9073 9074 9075 9076 9077 9078 9079 9080 9081 9082 9083 9084 9085 9086 9087 9088 9089 9090 9091 9092 9093 9094 9095 9096 9097 9098 9099 9100 9101 9102 9103 9104 9105 9106 9107 9108 9109 9110 9111 9112 9113 9114 9115 9116 9117 9118 9119 9120 9121 9122 9123 9124 9125 9126 9127 9128 9129 9130 9131 9132 9133 9134 9135 9136 9137 9138 9139 9140 9141 9142 9143 9144 9145 9146 9147 9148 9149 9150 9151 9152 9153 9154 9155 9156 9157 9158 9159 9160 9161 9162 9163 9164 9165 9166 9167 9168 9169 9170 9171 9172 9173 9174 9175 9176 9177 9178 9179 9180 9181 9182 9183 9184 9185 9186 9187 9188 9189 9190 9191 9192 9193 9194 9195 9196 9197 9198 9199 9200 9201 9202 9203 9204 9205 9206 9207 9208 9209 9210 9211 9212 9213 9214 9215 9216 9217 9218 9219 9220 9221 9222 9223 9224 9225 9226 9227 9228 9229 9230 9231 9232 9233 9234 9235 9236 9237 9238 9239 9240 9241 9242 9243 9244 9245 9246 9247 9248 9249 9250 9251 9252 9253 9254 9255 9256 9257 9258 9259 9260 9261 9262 9263 9264 9265 9266 9267 9268 9269 9270 9271 9272 9273 9274 9275 9276 9277 9278 9279 9280 9281 9282 9283 9284 9285 9286 9287 9288 9289 9290 9291 9292 9293 9294 9295 9296 9297 9298 9299 9300 9301 9302 9303 9304 9305 9306 9307 9308 9309 9310 9311 9312 9313 9314 9315 9316 9317 9318 9319 9320 9321 9322 9323 9324 9325 9326 9327 9328 9329 9330 9331 9332 9333 9334 9335 9336 9337 9338 9339 9340 9341 9342 9343 9344 9345 9346 9347 9348 9349 9350 9351 9352 9353 9354 9355 9356 9357 9358 9359 9360 9361 9362 9363 9364 9365 9366 9367 9368 9369 9370 9371 9372 9373 9374 9375 9376 9377 9378 9379 9380 9381 9382 9383 9384 9385 9386 9387 9388 9389 9390 9391 9392 9393 9394 9395 9396 9397 9398 9399 9400 9401 9402 9403 9404 9405 9406 9407 9408 9409 9410 9411 9412 9413 9414 9415 9416 9417 9418 9419 9420 9421 
9422 9423 9424 9425 9426 9427 9428 9429 9430 9431 9432 9433 9434 9435 9436 9437 9438 9439 9440 9441 9442 9443 9444 9445 9446 9447 9448 9449 9450 9451 9452 9453 9454 9455 9456 9457 9458 9459 9460 9461 9462 9463 9464 9465 9466 9467 9468 9469 9470 9471 9472 9473 9474 9475 9476 9477 9478 9479 9480 9481 9482 9483 9484 9485 9486 9487 9488 9489 9490 9491 9492 9493 9494 9495 9496 9497 9498 9499 9500 9501 9502 9503 9504 9505 9506 9507 9508 9509 9510 9511 9512 9513 9514 9515 9516 9517 9518 9519 9520 9521 9522 9523 9524 9525 9526 9527 9528 9529 9530 9531 9532 9533 9534 9535 9536 9537 9538 9539 9540 9541 9542 9543 9544 9545 9546 9547 9548 9549 9550 9551 9552 9553 9554 9555 9556 9557 9558 9559 9560 9561 9562 9563 9564 9565 9566 9567 9568 9569 9570 9571 9572 9573 9574 9575 9576 9577 9578 9579 9580 9581 9582 9583 9584 9585 9586 9587 9588 9589 9590 9591 9592 9593 9594 9595 9596 9597 9598 9599 9600 9601 9602 9603 9604 9605 9606 9607 9608 9609 9610 9611 9612 9613 9614 9615 9616 9617 9618 9619 9620 9621 9622 9623 9624 9625 9626 9627 9628 9629 9630 9631 9632 9633 9634 9635 9636 9637 9638 9639 9640 9641 9642 9643 9644 9645 9646 9647 9648 9649 9650 9651 9652 9653 9654 9655 9656 9657 9658 9659 9660 9661 9662 9663 9664 9665 9666 9667 9668 9669 9670 9671 9672 9673 9674 9675 9676 9677 9678 9679 9680 9681 9682 9683 9684 9685 9686 9687 9688 9689 9690 9691 9692 9693 9694 9695 9696 9697 9698 9699 9700 9701 9702 9703 9704 9705 9706 9707 9708 9709 9710 9711 9712 9713 9714 9715 9716 9717 9718 9719 9720 9721 9722 9723 9724 9725 9726 9727 9728 9729 9730 9731 9732 9733 9734 9735 9736 9737 9738 9739 9740 9741 9742 9743 9744 9745 9746 9747 9748 9749 9750 9751 9752 9753 9754 9755 9756 9757 9758 9759 9760 9761 9762 9763 9764 9765 9766 9767 9768 9769 9770 9771 9772 9773 9774 9775 9776 9777 9778 9779 9780 9781 9782 9783 9784 9785 9786 9787 9788 9789 9790 9791 9792 9793 9794 9795 9796 9797 9798 9799 9800 9801 9802 9803 9804 9805 9806 9807 9808 9809 9810 9811 9812 9813 9814 9815 9816 9817 9818 9819 9820 9821 
9822 9823 9824 9825 9826 9827 9828 9829 9830 9831 9832 9833 9834 9835 9836 9837 9838 9839 9840 9841 9842 9843 9844 9845 9846 9847 9848 9849 9850 9851 9852 9853 9854 9855 9856 9857 9858 9859 9860 9861 9862 9863 9864 9865 9866 9867 9868 9869 9870 9871 9872 9873 9874 9875 9876 9877 9878 9879 9880 9881 9882 9883 9884 9885 9886 9887 9888 9889 9890 9891 9892 9893 9894 9895 9896 9897 9898 9899 9900 9901 9902 9903 9904 9905 9906 9907 9908 9909 9910 9911 9912 9913 9914 9915 9916 9917 9918 9919 9920 9921 9922 9923 9924 9925 9926 9927 9928 9929 9930 9931 9932 9933 9934 9935 9936 9937 9938 9939 9940 9941 9942 9943 9944 9945 9946 9947 9948 9949 9950 9951 9952 9953 9954 9955 9956 9957 9958 9959 9960 9961 9962 9963 9964 9965 9966 9967 9968 9969 9970 9971 9972 9973 9974 9975 9976 9977 9978 9979 9980 9981 9982 9983 9984 9985 9986 9987 9988 9989 9990 9991 9992 9993 9994 9995 9996 9997 9998 9999 10000 10001 10002 10003 10004 10005 10006 10007 10008 10009 10010 10011 10012 10013 10014 10015 10016 10017 10018 10019 10020 10021 10022 10023 10024 10025 10026 10027 10028 10029 10030 10031 10032 10033 10034 10035 10036 10037 10038 10039 10040 10041 10042 10043 10044 10045 10046 10047 10048 10049 10050 10051 10052 10053 10054 10055 10056 10057 10058 10059 10060 10061 10062 10063 10064 10065 10066 10067 10068 10069 10070 10071 10072 10073 10074 10075 10076 10077 10078 10079 10080 10081 10082 10083 10084 10085 10086 10087 10088 10089 10090 10091 10092 10093 10094 10095 10096 10097 10098 10099 10100 10101 10102 10103 10104 10105 10106 10107 10108 10109 10110 10111 10112 10113 10114 10115 10116 10117 10118 10119 10120 10121 10122 10123 10124 10125 10126 10127 10128 10129 10130 10131 10132 10133 10134 10135 10136 10137 10138 10139 10140 10141 10142 10143 10144 10145 10146 10147 10148 10149 10150 10151 10152 10153 10154 10155 10156 10157 10158 10159 10160 10161 10162 10163 10164 10165 10166 10167 10168 10169 10170 10171 10172 10173 10174 10175 10176 10177 10178 10179 10180 10181 10182 10183 10184 
10185 10186 10187 10188 10189 10190 10191 10192 10193 10194 10195 10196 10197 10198 10199 10200 10201 10202 10203 10204 10205 10206 10207 10208 10209 10210 10211 10212 10213 10214 10215 10216 10217 10218 10219 10220 10221 10222 10223 10224 10225 10226 10227 10228 10229 10230 10231 10232 10233 10234 10235 10236 10237 10238 10239 10240 10241 10242 10243 10244 10245 10246 10247 10248 10249 10250 10251 10252 10253 10254 10255 10256 10257 10258 10259 10260 10261 10262 10263 10264 10265 10266 10267 10268 10269 10270 10271 10272 10273 10274 10275 10276 10277 10278 10279 10280 10281 10282 10283 10284 10285 10286 10287 10288 10289 10290 10291 10292 10293 10294 10295 10296 10297 10298 10299 10300 10301 10302 10303 10304 10305 10306 10307 10308 10309 10310 10311 10312 10313 10314 10315 10316 10317 10318 10319 10320 10321 10322 10323 10324 10325 10326 10327 10328 10329 10330 10331 10332 10333 10334 10335 10336 10337 10338 10339 10340 10341 10342 10343 10344 10345 10346 10347 10348 10349 10350 10351 10352 10353 10354 10355 10356 10357 10358 10359 10360 10361 10362 10363 10364 10365 10366 10367 10368 10369 10370 10371 10372 10373 10374 10375 10376 10377 10378 10379 10380 10381 10382 10383 10384 10385 10386 10387 10388 10389 10390 10391 10392 10393 10394 10395 10396 10397 10398 10399 10400 10401 10402 10403 10404 10405 10406 10407 10408 10409 10410 10411 10412 10413 10414 10415 10416 10417 10418 10419 10420 10421 10422 10423 10424 10425 10426 10427 10428 10429 10430 10431 10432 10433 10434 10435 10436 10437 10438 10439 10440 10441 10442 10443 10444 10445 10446 10447 10448 10449 10450 10451 10452 10453 10454 10455 10456 10457 10458 10459 10460 10461 10462 10463 10464 10465 10466 10467 10468 10469 10470 10471 10472 10473 10474 10475 10476 10477 10478 10479 10480 10481 10482 10483 10484 10485 10486 10487 10488 10489 10490 10491 10492 10493 10494 10495 10496 10497 10498 10499 10500 10501 10502 10503 10504 10505 10506 10507 10508 10509 10510 10511 10512 10513 10514 10515 10516 10517 
10518 10519 10520 10521 10522 10523 10524 10525 10526 10527 10528 10529 10530 10531 10532 10533 10534 10535 10536 10537 10538 10539 10540 10541 10542 10543 10544 10545 10546 10547 10548 10549 10550 10551 10552 10553 10554 10555 10556 10557 10558 10559 10560 10561 10562 10563 10564 10565 10566 10567 10568 10569 10570 10571 10572 10573 10574 10575 10576 10577 10578 10579 10580 10581 10582 10583 10584 10585 10586 10587 10588 10589 10590 10591 10592 10593 10594 10595 10596 10597 10598 10599 10600 10601 10602 10603 10604 10605 10606 10607 10608 10609 10610 10611 10612 10613 10614 10615 10616 10617 10618 10619 10620 10621 10622 10623 10624 10625 10626 10627 10628 10629 10630 10631 10632 10633 10634 10635 10636 10637 10638 10639 10640 10641 10642 10643 10644 10645 10646 10647 10648 10649 10650 10651 10652 10653 10654 10655 10656 10657 10658 10659 10660 10661 10662 10663 10664 10665 10666 10667 10668 10669 10670 10671 10672 10673 10674 10675 10676 10677 10678 10679 10680 10681 10682 10683 10684 10685 10686 10687 10688 10689 10690 10691 10692 10693 10694 10695 10696 10697 10698 10699 10700 10701 10702 10703 10704 10705 10706 10707 10708 10709 10710 10711 10712 10713 10714 10715 10716 10717 10718 10719 10720 10721 10722 10723 10724 10725 10726 10727 10728 10729 10730 10731 10732 10733 10734 10735 10736 10737 10738 10739 10740 10741 10742 10743 10744 10745 10746 10747 10748 10749 10750 10751 10752 10753 10754 10755 10756 10757 10758 10759 10760 10761 10762 10763 10764 10765 10766 10767 10768 10769 10770 10771 10772 10773 10774 10775 10776 10777 10778 10779 10780 10781 10782 10783 10784 10785 10786 10787 10788 10789 10790 10791 10792 10793 10794 10795 10796 10797 10798 10799 10800 10801 10802 10803 10804 10805 10806 10807 10808 10809 10810 10811 10812 10813 10814 10815 10816 10817 10818 10819 10820 10821 10822 10823 10824 10825 10826 10827 10828 10829 10830 10831 10832 10833 10834 10835 10836 10837 10838 10839 10840 10841 10842 10843 10844 10845 10846 10847 10848 10849 10850 
10851 10852 10853 10854 10855 10856 10857 10858 10859 10860 10861 10862 10863 10864 10865 10866 10867 10868 10869 10870 10871 10872 10873 10874 10875 10876 10877 10878 10879 10880 10881 10882 10883 10884 10885 10886 10887 10888 10889 10890 10891 10892 10893 10894 10895 10896 10897 10898 10899 10900 10901 10902 10903 10904 10905 10906 10907 10908 10909 10910 10911 10912 10913 10914 10915 10916 10917 10918 10919 10920 10921 10922 10923 10924 10925 10926 10927 10928 10929 10930 10931 10932 10933 10934 10935 10936 10937 10938 10939 10940 10941 10942 10943 10944 10945 10946 10947 10948 10949 10950 10951 10952 10953 10954 10955 10956 10957 10958 10959 10960 10961 10962 10963 10964 10965 10966 10967 10968 10969 10970 10971 10972 10973 10974 10975 10976 10977 10978 10979 10980 10981 10982 10983 10984 10985 10986 10987 10988 10989 10990 10991 10992 10993 10994 10995 10996 10997 10998 10999 11000 11001 11002 11003 11004 11005 11006 11007 11008 11009 11010 11011 11012 11013 11014 11015 11016 11017 11018 11019 11020 11021 11022 11023 11024 11025 11026 11027 11028 11029 11030 11031 11032 11033 11034 11035 11036 11037 11038 11039 11040 11041 11042 11043 11044 11045 11046 11047 11048 11049 11050 11051 11052 11053 11054 11055 11056 11057 11058 11059 11060 11061 11062 11063 11064 11065 11066 11067 11068 11069 11070 11071 11072 11073 11074 11075 11076 11077 11078 11079 11080 11081 11082 11083 11084 11085 11086 11087 11088 11089 11090 11091 11092 11093 11094 11095 11096 11097 11098 11099 11100 11101 11102 11103 11104 11105 11106 11107 11108 11109 11110 11111 11112 11113 11114 11115 11116 11117 11118 11119 11120 11121 11122 11123 11124 11125 11126 11127 11128 11129 11130 11131 11132 11133 11134 11135 11136 11137 11138 11139 11140 11141 11142 11143 11144 11145 11146 11147 11148 11149 11150 11151 11152 11153 11154 11155 11156 11157 11158 11159 11160 11161 11162 11163 11164 11165 11166 11167 11168 11169 11170 11171 11172 11173 11174 11175 11176 11177 11178 11179 11180 11181 11182 11183 
11184 11185 11186 11187 11188 11189 11190 11191 11192 11193 11194 11195 11196 11197 11198 11199 11200 11201 11202 11203 11204 11205 11206 11207 11208 11209 11210 11211 11212 11213 11214 11215 11216 11217 11218 11219 11220 11221 11222
{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "aabfb24b",
   "metadata": {},
   "outputs": [],
   "source": [
    "COMBO = '/home/kkrasnowska/anaconda3/envs/combo_p39/bin/combo'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "54a97ebd",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "I0406 22:49:19.084177 139884283720768 params.py:248] include_in_archive = None\n",
      "2023-04-06 22:49:19,085 - INFO - allennlp.common.params - random_seed = 8787\n",
      "2023-04-06 22:49:19,085 - INFO - allennlp.common.params - numpy_seed = 8787\n",
      "2023-04-06 22:49:19,085 - INFO - allennlp.common.params - pytorch_seed = 8787\n",
      "2023-04-06 22:49:19,086 - INFO - allennlp.common.checks - Pytorch version: 1.13.1\n",
      "2023-04-06 22:49:19,087 - INFO - allennlp.common.params - type = default\n",
      "2023-04-06 22:49:19,087 - INFO - allennlp.common.params - dataset_reader.type = conllu\n",
      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.lazy = False\n",
      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.cache_directory = None\n",
      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.max_instances = None\n",
      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.manual_distributed_sharding = False\n",
      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.manual_multi_process_sharding = False\n",
      "2023-04-06 22:49:19,088 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.type = characters_const_padding\n",
      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.namespace = token_characters\n",
      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.byte_encoding = None\n",
      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.lowercase_characters = False\n",
      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.start_tokens = None\n",
      "2023-04-06 22:49:19,089 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.end_tokens = None\n",
      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.min_padding_length = 32\n",
      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.char.token_min_padding_length = 0\n",
      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.type = feats_indexer\n",
      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.namespace = feats\n",
      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.feature_name = feats_\n",
      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.feats.token_min_padding_length = 0\n",
      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.type = characters_const_padding\n",
      "2023-04-06 22:49:19,090 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.namespace = token_characters\n",
      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.byte_encoding = None\n",
      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.lowercase_characters = False\n",
      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.start_tokens = ['__START__']\n",
      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.character_tokenizer.end_tokens = ['__END__']\n",
      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.start_tokens = None\n",
      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.end_tokens = None\n",
      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.min_padding_length = 32\n",
      "2023-04-06 22:49:19,091 - INFO - allennlp.common.params - dataset_reader.token_indexers.lemma.token_min_padding_length = 0\n",
      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.type = pretrained_transformer_mismatched_fixed\n",
      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.token_min_padding_length = 0\n",
      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.model_name = allegro/herbert-large-cased\n",
      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.namespace = tags\n",
      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.max_length = None\n",
      "2023-04-06 22:49:19,092 - INFO - allennlp.common.params - dataset_reader.token_indexers.token.tokenizer_kwargs.use_fast = False\n",
      "2023-04-06 22:49:21,857 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.type = single_id\n",
      "2023-04-06 22:49:21,857 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.namespace = upostag\n",
      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.lowercase_tokens = False\n",
      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.start_tokens = None\n",
      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.end_tokens = None\n",
      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.feature_name = pos_\n",
      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.upostag.token_min_padding_length = 0\n",
      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.type = single_id\n",
      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.namespace = xpostag\n",
      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.lowercase_tokens = False\n",
      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.start_tokens = None\n",
      "2023-04-06 22:49:21,858 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.end_tokens = None\n",
      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.feature_name = tag_\n",
      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.default_value = THIS IS A REALLY UNLIKELY VALUE THAT HAS TO BE A STRING\n",
      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.token_indexers.xpostag.token_min_padding_length = 0\n",
      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.type = characters_const_padding\n",
      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.namespace = lemma_characters\n",
      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.byte_encoding = None\n",
      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.lowercase_characters = False\n",
      "2023-04-06 22:49:21,859 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.start_tokens = ['__START__']\n",
      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.character_tokenizer.end_tokens = ['__END__']\n",
      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.start_tokens = None\n",
      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.end_tokens = None\n",
      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.min_padding_length = 32\n",
      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.lemma_indexers.char.token_min_padding_length = 0\n",
      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.features = ['token', 'char']\n",
      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.targets = ['head', 'deprel']\n",
      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - dataset_reader.use_sem = False\n",
      "2023-04-06 22:49:21,860 - INFO - allennlp.common.params - train_data_path = connlu/pdbc-train.conllu\n",
      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - datasets_for_vocab_creation = ['train']\n",
      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - validation_dataset_reader = None\n",
      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - validation_data_path = connlu/pdbc-validation.conllu\n",
      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - validation_data_loader = None\n",
      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - test_data_path = None\n",
      "2023-04-06 22:49:21,861 - INFO - allennlp.common.params - evaluate_on_test = False\n",
      "2023-04-06 22:49:21,862 - INFO - allennlp.common.params - batch_weight_key = \n",
      "2023-04-06 22:49:21,862 - INFO - allennlp.training.util - Reading training data from connlu/pdbc-train.conllu\n",
      "reading instances: 0it [00:00, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "reading instances: 3853it [00:02, 1926.46it/s]\n",
      "reading instances: 8024it [00:04, 1907.69it/s]\n",
      "reading instances: 11424it [00:06, 1840.15it/s]\n",
      "reading instances: 14555it [00:08, 1654.52it/s]\n",
      "reading instances: 17659it [00:09, 1772.69it/s]\n",
      "2023-04-06 22:49:31,824 - INFO - allennlp.training.util - Reading validation data from connlu/pdbc-validation.conllu\n",
      "reading instances: 0it [00:00, ?it/s]\n",
      "reading instances: 1851it [00:02, 897.46it/s]\n",
      "reading instances: 2211it [00:02, 933.13it/s]\n",
      "2023-04-06 22:49:34,194 - INFO - allennlp.commands.train - From dataset instances, train will be considered for vocabulary creation.\n",
      "2023-04-06 22:49:34,194 - INFO - allennlp.common.params - vocabulary.type = from_instances_extended\n",
      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.min_count = None\n",
      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.max_vocab_size = None\n",
      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.non_padded_namespaces = ['head_labels']\n",
      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.pretrained_files = None\n",
      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.only_include_pretrained_words = True\n",
      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.min_pretrained_embeddings = None\n",
      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.padding_token = __PAD__\n",
      "2023-04-06 22:49:34,195 - INFO - allennlp.common.params - vocabulary.oov_token = _\n",
      "2023-04-06 22:49:34,195 - INFO - allennlp.data.vocabulary - Fitting token dictionary from dataset.\n",
      "building vocab: 0it [00:00, ?it/s]\n",
      "building vocab: 16773it [00:02, 8386.16it/s]\n",
      "building vocab: 17659it [00:02, 8423.42it/s]\n",
      "2023-04-06 22:49:36,293 - INFO - allennlp.common.params - model.type = semantic_multitask\n",
      "2023-04-06 22:49:36,293 - INFO - allennlp.common.params - model.text_field_embedder.type = basic\n",
      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.type = char_embeddings_from_config\n",
      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.embedding_dim = 64\n",
      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.input_dim = 64\n",
      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.filters = [512, 256, 64]\n",
      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.kernel_size = [3, 3, 3]\n",
      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.stride = [1, 1, 1]\n",
      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.padding = [1, 2, 4]\n",
      "2023-04-06 22:49:36,294 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.dilation = [1, 2, 4]\n",
      "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.dilated_cnn_encoder.activations = ['relu', 'relu', 'linear']\n",
      "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - type = relu\n",
      "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - type = relu\n",
      "2023-04-06 22:49:36,295 - INFO - allennlp.common.params - type = linear\n",
      "2023-04-06 22:49:36,300 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.char.vocab_namespace = token_characters\n",
      "2023-04-06 22:49:36,300 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.type = transformers_word_embeddings\n",
      "2023-04-06 22:49:36,300 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.model_name = allegro/herbert-large-cased\n",
      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_dim = 100\n",
      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_activation = <function TransformersWordEmbedder.<lambda> at 0x7f388b745280>\n",
      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.projection_dropout_rate = 0.0\n",
      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.freeze_transformer = True\n",
      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.last_layer_only = True\n",
      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.tokenizer_kwargs.use_fast = False\n",
      "2023-04-06 22:49:36,301 - INFO - allennlp.common.params - model.text_field_embedder.token_embedders.token.transformer_kwargs = None\n",
      "2023-04-06 22:49:44,104 - INFO - allennlp.common.params - model.seq_encoder.type = combo_encoder\n",
      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.input_size = 164\n",
      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.hidden_size = 512\n",
      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.num_layers = 2\n",
      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.recurrent_dropout_probability = 0.33\n",
      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.layer_dropout_probability = 0.33\n",
      "2023-04-06 22:49:44,105 - INFO - allennlp.common.params - model.seq_encoder.stacked_bilstm.use_highway = False\n",
      "2023-04-06 22:49:44,804 - INFO - allennlp.common.params - model.seq_encoder.layer_dropout_probability = 0.33\n",
      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.use_sample_weight = True\n",
      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.lemmatizer = None\n",
      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.upos_tagger = None\n",
      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.xpos_tagger = None\n",
      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.semantic_relation = None\n",
      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.morphological_feat = None\n",
      "2023-04-06 22:49:44,805 - INFO - allennlp.common.params - model.dependency_relation.type = combo_dependency_parsing_from_vocab\n",
      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.vocab_namespace = deprel_labels\n",
      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.in_features = 1024\n",
      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.out_features = 512\n",
      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.activation = tanh\n",
      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - type = tanh\n",
      "2023-04-06 22:49:44,806 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.head_projection_layer.dropout_rate = 0.0\n",
      "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.in_features = 1024\n",
      "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.out_features = 512\n",
      "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.activation = tanh\n",
      "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - type = tanh\n",
      "2023-04-06 22:49:44,811 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.dependency_projection_layer.dropout_rate = 0.0\n",
      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_predictor.cycle_loss_n = 0\n",
      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.in_features = 1024\n",
      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.out_features = 128\n",
      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.activation = tanh\n",
      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - type = tanh\n",
      "2023-04-06 22:49:44,816 - INFO - allennlp.common.params - model.dependency_relation.head_projection_layer.dropout_rate = 0.25\n",
      "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.in_features = 1024\n",
      "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.out_features = 128\n",
      "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.activation = tanh\n",
      "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - type = tanh\n",
      "2023-04-06 22:49:44,818 - INFO - allennlp.common.params - model.dependency_relation.dependency_projection_layer.dropout_rate = 0.25\n",
      "2023-04-06 22:49:44,820 - INFO - allennlp.common.params - model.enhanced_dependency_relation = None\n",
      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.0.1.type = l2\n",
      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.0.1.alpha = 1e-06\n",
      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.1.1.type = l2\n",
      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.1.1.alpha = 1e-06\n",
      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.2.1.type = l2\n",
      "2023-04-06 22:49:44,821 - INFO - allennlp.common.params - model.regularizer.regexes.2.1.alpha = 1e-06\n",
      "2023-04-06 22:49:44,822 - INFO - allennlp.common.params - model.regularizer.regexes.3.1.type = l2\n",
      "2023-04-06 22:49:44,822 - INFO - allennlp.common.params - model.regularizer.regexes.3.1.alpha = 1e-05\n",
      "2023-04-06 22:49:44,822 - INFO - filelock - Lock 139878665944848 acquired on ./allennlpru3hb8qq/vocabulary/.lock\n",
      "2023-04-06 22:49:44,823 - INFO - filelock - Lock 139878665944848 released on ./allennlpru3hb8qq/vocabulary/.lock\n",
      "2023-04-06 22:49:44,823 - INFO - allennlp.common.params - data_loader.type = pytorch_dataloader\n",
      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.batch_size = 1\n",
      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.shuffle = False\n",
      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.sampler = None\n",
      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.num_workers = 0\n",
      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.pin_memory = False\n",
      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.drop_last = False\n",
      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.timeout = 0\n",
      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.worker_init_fn = None\n",
      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.multiprocessing_context = None\n",
      "2023-04-06 22:49:44,824 - INFO - allennlp.common.params - data_loader.batches_per_epoch = None\n",
      "2023-04-06 22:49:44,825 - INFO - allennlp.common.params - data_loader.batch_sampler.type = token_count\n",
      "2023-04-06 22:49:44,825 - INFO - allennlp.common.params - data_loader.batch_sampler.word_batch_size = 2500\n",
      "2023-04-06 22:49:44,825 - INFO - allennlp.common.params - data_loader.batch_sampler.shuffle_dataset = True\n",
      "/home/kkrasnowska/anaconda3/envs/combo_p39/lib/python3.8/site-packages/combo/data/samplers/samplers.py:51: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n",
      "  self.batch_dataset = np.array(self.batch_dataset)[indices].tolist()\n",
      "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.type = pytorch_dataloader\n",
      "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.batch_size = 1\n",
      "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.shuffle = False\n",
      "2023-04-06 22:49:44,845 - INFO - allennlp.common.params - data_loader.sampler = None\n",
      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.num_workers = 0\n",
      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.pin_memory = False\n",
      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.drop_last = False\n",
      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.timeout = 0\n",
      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.worker_init_fn = None\n",
      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.multiprocessing_context = None\n",
      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batches_per_epoch = None\n",
      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batch_sampler.type = token_count\n",
      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batch_sampler.word_batch_size = 2500\n",
      "2023-04-06 22:49:44,846 - INFO - allennlp.common.params - data_loader.batch_sampler.shuffle_dataset = True\n",
      "2023-04-06 22:49:44,849 - INFO - allennlp.common.params - trainer.type = gradient_descent_validate_n\n",
      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.patience = 1\n",
      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.validation_metric = +EM\n",
      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.num_epochs = 400\n",
      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.cuda_device = 0\n",
      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.grad_norm = None\n",
      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.grad_clipping = 5\n",
      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.distributed = None\n",
      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.world_size = 1\n",
      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.num_gradient_accumulation_steps = 1\n",
      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.use_amp = False\n",
      "2023-04-06 22:49:44,850 - INFO - allennlp.common.params - trainer.no_grad = None\n",
      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.momentum_scheduler = None\n",
      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.tensorboard_writer = None\n",
      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.moving_average = None\n",
      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.batch_callbacks = None\n",
      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.epoch_callbacks.0.type = transfer_patience\n",
      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.end_callbacks = None\n",
      "2023-04-06 22:49:44,851 - INFO - allennlp.common.params - trainer.trainer_callbacks = None\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.type = adam\r\n",
      "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.parameter_groups = None\r\n",
      "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.lr = 0.002\r\n",
      "2023-04-06 22:49:47,277 - INFO - allennlp.common.params - trainer.optimizer.betas = [0.9, 0.9]\r\n",
      "2023-04-06 22:49:47,278 - INFO - allennlp.common.params - trainer.optimizer.eps = 1e-08\r\n",
      "2023-04-06 22:49:47,278 - INFO - allennlp.common.params - trainer.optimizer.weight_decay = 0.0\r\n",
      "2023-04-06 22:49:47,278 - INFO - allennlp.common.params - trainer.optimizer.amsgrad = False\r\n",
      "2023-04-06 22:49:47,278 - INFO - allennlp.training.optimizers - Number of trainable parameters: 11053872\r\n",
      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - The following parameters are Frozen (without gradient):\r\n",
      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.word_embeddings.weight\r\n",
      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.position_embeddings.weight\r\n",
      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.token_type_embeddings.weight\r\n",
      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.embeddings.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,278 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.dense.weight\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.dense.bias\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.0.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,279 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.dense.weight\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.dense.bias\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.1.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,280 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.dense.weight\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.dense.bias\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.2.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,281 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.dense.weight\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.dense.bias\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.3.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,282 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.dense.weight\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.dense.bias\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.4.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,283 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.dense.weight\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.dense.bias\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.5.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,284 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.dense.weight\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.dense.bias\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.6.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,285 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.dense.weight\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.dense.bias\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.7.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,286 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.dense.weight\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.dense.bias\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.8.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,287 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.dense.weight\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.dense.bias\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.9.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,288 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.dense.weight\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.dense.bias\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.10.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,289 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.dense.weight\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.dense.bias\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.11.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,290 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.dense.weight\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.dense.bias\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.12.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,291 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.dense.weight\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.dense.bias\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.13.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,292 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.dense.weight\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.dense.bias\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.14.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.dense.weight\r\n",
      "2023-04-06 22:49:47,293 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.dense.bias\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.15.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.dense.weight\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.dense.bias\r\n",
      "2023-04-06 22:49:47,294 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.16.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.dense.weight\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.dense.bias\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,295 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.17.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.dense.weight\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.dense.bias\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,296 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.18.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.dense.weight\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.dense.bias\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.19.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,297 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.dense.weight\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.dense.bias\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.20.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,298 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.dense.weight\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.dense.bias\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.21.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,299 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.dense.weight\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.dense.bias\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.22.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.query.weight\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.query.bias\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.key.weight\r\n",
      "2023-04-06 22:49:47,300 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.key.bias\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.value.weight\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.self.value.bias\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.dense.weight\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.dense.bias\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.attention.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.intermediate.dense.weight\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.intermediate.dense.bias\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.dense.weight\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.dense.bias\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.LayerNorm.weight\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.encoder.layer.23.output.LayerNorm.bias\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.pooler.dense.weight\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token._matched_embedder.transformer_model.pooler.dense.bias\r\n",
      "2023-04-06 22:49:47,301 - INFO - allennlp.common.util - The following parameters are Tunable (with gradient):\r\n",
      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - _head_sentinel\r\n",
      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.char_embed.weight\r\n",
      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.0.weight\r\n",
      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.0.bias\r\n",
      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.1.weight\r\n",
      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.1.bias\r\n",
      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.2.weight\r\n",
      "2023-04-06 22:49:47,302 - INFO - allennlp.common.util - text_field_embedder.token_embedder_char.dilated_cnn_encoder._module.conv1d_layers.2.bias\r\n",
      "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token.projection_layer.weight\r\n",
      "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - text_field_embedder.token_embedder_token.projection_layer.bias\r\n",
      "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.input_linearity.weight\r\n",
      "2023-04-06 22:49:47,303 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.state_linearity.weight\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_0.cell.state_linearity.bias\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.input_linearity.weight\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.state_linearity.weight\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_0.cell.state_linearity.bias\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.input_linearity.weight\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.state_linearity.weight\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.forward_layer_1.cell.state_linearity.bias\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.input_linearity.weight\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.state_linearity.weight\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - seq_encoder._module.backward_layer_1.cell.state_linearity.bias\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.head_projection_layer.weight\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.head_projection_layer.bias\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.dependency_projection_layer.weight\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_predictor.dependency_projection_layer.bias\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_projection_layer.weight\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.head_projection_layer.bias\r\n",
      "2023-04-06 22:49:47,304 - INFO - allennlp.common.util - dependency_relation.dependency_projection_layer.weight\r\n",
      "2023-04-06 22:49:47,305 - INFO - allennlp.common.util - dependency_relation.dependency_projection_layer.bias\r\n",
      "2023-04-06 22:49:47,305 - INFO - allennlp.common.util - dependency_relation.relation_prediction_layer.weight\r\n",
      "2023-04-06 22:49:47,305 - INFO - allennlp.common.util - dependency_relation.relation_prediction_layer.bias\r\n",
      "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.type = combo_scheduler\r\n",
      "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.patience = 6\r\n",
      "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.decreases = 2\r\n",
      "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.learning_rate_scheduler.threshold = 0.001\r\n",
      "2023-04-06 22:49:47,305 - INFO - allennlp.common.params - trainer.checkpointer.type = finishing_only_checkpointer\r\n",
      "2023-04-06 22:49:47,306 - INFO - allennlp.common.params - trainer.checkpointer.keep_serialized_model_every_num_seconds = None\r\n",
      "2023-04-06 22:49:47,306 - INFO - allennlp.common.params - trainer.checkpointer.num_serialized_models_to_keep = 2\r\n",
      "2023-04-06 22:49:47,306 - INFO - allennlp.common.params - trainer.checkpointer.model_save_interval = None\r\n",
      "2023-04-06 22:49:47,308 - INFO - combo.training.trainer - Beginning training.\r\n",
      "2023-04-06 22:49:47,308 - INFO - allennlp.training.trainer - Epoch 0/399\r\n",
      "2023-04-06 22:49:47,308 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.3G\r\n",
      "2023-04-06 22:49:47,308 - INFO - allennlp.training.trainer - GPU 0 memory usage: 1.4G\r\n",
      "2023-04-06 22:49:47,315 - INFO - allennlp.training.trainer - Training\r\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\r\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0000, UAS: 0.0492, LAS: 0.0000, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.7155, partial_loss/deprel_loss: 12.9573, partial_loss/cycle_loss: 0.0000, batch_loss: 12.4107, loss: 12.4107, batch_reg_loss: 0.1018, reg_loss: 0.1018 ||:   1%|          | 1/111 [00:03<07:00,  3.82s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0000, UAS: 0.0559, LAS: 0.0045, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 19.7004, partial_loss/deprel_loss: 16.3879, partial_loss/cycle_loss: 0.0000, batch_loss: 17.1516, loss: 25.2089, batch_reg_loss: 0.1012, reg_loss: 0.1015 ||:   4%|3         | 4/111 [00:06<05:11,  2.91s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0120, UAS: 0.0714, LAS: 0.0044, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 22.1129, partial_loss/deprel_loss: 9.0855, partial_loss/cycle_loss: 0.0000, batch_loss: 11.7916, loss: 24.6851, batch_reg_loss: 0.1006, reg_loss: 0.1012 ||:   6%|6         | 7/111 [00:08<03:56,  2.27s/it] \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0099, UAS: 0.0608, LAS: 0.0046, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 15.5869, partial_loss/deprel_loss: 9.3639, partial_loss/cycle_loss: 0.0000, batch_loss: 10.7085, loss: 21.3806, batch_reg_loss: 0.1000, reg_loss: 0.1009 ||:   9%|9         | 10/111 [00:10<03:01,  1.80s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0315, UAS: 0.0725, LAS: 0.0092, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 18.3275, partial_loss/deprel_loss: 7.1568, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4905, loss: 18.5717, batch_reg_loss: 0.0995, reg_loss: 0.1006 ||:  12%|#1        | 13/111 [00:12<02:26,  1.49s/it] \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0000, UAS: 0.0633, LAS: 0.0083, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 25.8989, partial_loss/deprel_loss: 11.7684, partial_loss/cycle_loss: 0.0000, batch_loss: 14.6935, loss: 17.9697, batch_reg_loss: 0.0991, reg_loss: 0.1003 ||:  14%|#4        | 16/111 [00:15<01:59,  1.26s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0064, UAS: 0.0604, LAS: 0.0079, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 16.1143, partial_loss/deprel_loss: 10.8376, partial_loss/cycle_loss: 0.0000, batch_loss: 11.9915, loss: 16.8737, batch_reg_loss: 0.0986, reg_loss: 0.1001 ||:  17%|#7        | 19/111 [00:17<01:39,  1.08s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0079, UAS: 0.0579, LAS: 0.0081, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 15.2368, partial_loss/deprel_loss: 10.3155, partial_loss/cycle_loss: 0.0000, batch_loss: 11.3978, loss: 16.0851, batch_reg_loss: 0.0981, reg_loss: 0.0998 ||:  20%|#9        | 22/111 [00:19<01:25,  1.04it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0259, UAS: 0.0602, LAS: 0.0091, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 13.9253, partial_loss/deprel_loss: 7.4326, partial_loss/cycle_loss: 0.0000, batch_loss: 8.8288, loss: 15.3859, batch_reg_loss: 0.0976, reg_loss: 0.0996 ||:  23%|##2       | 25/111 [00:21<01:17,  1.11it/s]  \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0267, UAS: 0.0629, LAS: 0.0101, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 23.9539, partial_loss/deprel_loss: 6.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 10.0631, loss: 14.9031, batch_reg_loss: 0.0971, reg_loss: 0.0994 ||:  25%|##5       | 28/111 [00:23<01:10,  1.18it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0139, UAS: 0.0629, LAS: 0.0103, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 19.2664, partial_loss/deprel_loss: 8.1915, partial_loss/cycle_loss: 0.0000, batch_loss: 10.5031, loss: 14.5860, batch_reg_loss: 0.0966, reg_loss: 0.0991 ||:  28%|##7       | 31/111 [00:25<01:04,  1.23it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0056, UAS: 0.0635, LAS: 0.0105, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 14.2399, partial_loss/deprel_loss: 9.7935, partial_loss/cycle_loss: 0.0000, batch_loss: 10.7789, loss: 14.1692, batch_reg_loss: 0.0961, reg_loss: 0.0989 ||:  31%|###       | 34/111 [00:27<01:00,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0148, UAS: 0.0660, LAS: 0.0107, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.0003, partial_loss/deprel_loss: 6.0032, partial_loss/cycle_loss: 0.0000, batch_loss: 6.4982, loss: 13.6788, batch_reg_loss: 0.0956, reg_loss: 0.0986 ||:  33%|###3      | 37/111 [00:30<00:58,  1.26it/s]  \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0159, UAS: 0.0717, LAS: 0.0140, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.5919, partial_loss/deprel_loss: 8.8836, partial_loss/cycle_loss: 0.0000, batch_loss: 9.3203, loss: 13.2278, batch_reg_loss: 0.0950, reg_loss: 0.0983 ||:  36%|###6      | 40/111 [00:32<00:58,  1.22it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0160, UAS: 0.0744, LAS: 0.0148, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.1016, partial_loss/deprel_loss: 9.2769, partial_loss/cycle_loss: 0.0000, batch_loss: 9.5363, loss: 12.8973, batch_reg_loss: 0.0945, reg_loss: 0.0981 ||:  39%|###8      | 43/111 [00:34<00:52,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0467, UAS: 0.0768, LAS: 0.0156, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8362, partial_loss/deprel_loss: 6.5938, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5361, loss: 12.5863, batch_reg_loss: 0.0939, reg_loss: 0.0978 ||:  41%|####1     | 46/111 [00:37<00:49,  1.31it/s] \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0130, UAS: 0.0790, LAS: 0.0162, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 12.9970, partial_loss/deprel_loss: 11.0561, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5376, loss: 12.3941, batch_reg_loss: 0.0933, reg_loss: 0.0976 ||:  44%|####4     | 49/111 [00:39<00:46,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0044, UAS: 0.0785, LAS: 0.0158, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 14.6006, partial_loss/deprel_loss: 11.6897, partial_loss/cycle_loss: 0.0000, batch_loss: 12.3646, loss: 12.3354, batch_reg_loss: 0.0927, reg_loss: 0.0973 ||:  47%|####6     | 52/111 [00:41<00:43,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0115, UAS: 0.0791, LAS: 0.0156, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 12.7207, partial_loss/deprel_loss: 11.0801, partial_loss/cycle_loss: 0.0000, batch_loss: 11.5003, loss: 12.2236, batch_reg_loss: 0.0921, reg_loss: 0.0970 ||:  50%|####9     | 55/111 [00:43<00:42,  1.32it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0243, UAS: 0.0817, LAS: 0.0158, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.6552, partial_loss/deprel_loss: 7.4151, partial_loss/cycle_loss: 0.0000, batch_loss: 7.3545, loss: 12.0074, batch_reg_loss: 0.0915, reg_loss: 0.0967 ||:  52%|#####2    | 58/111 [00:45<00:38,  1.36it/s]   \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0191, UAS: 0.0860, LAS: 0.0174, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 11.0116, partial_loss/deprel_loss: 10.2631, partial_loss/cycle_loss: 0.0000, batch_loss: 10.5036, loss: 11.7766, batch_reg_loss: 0.0908, reg_loss: 0.0965 ||:  55%|#####4    | 61/111 [00:48<00:38,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0343, UAS: 0.0937, LAS: 0.0194, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.9906, partial_loss/deprel_loss: 8.5044, partial_loss/cycle_loss: 0.0000, batch_loss: 8.4916, loss: 11.4687, batch_reg_loss: 0.0900, reg_loss: 0.0961 ||:  59%|#####8    | 65/111 [00:50<00:33,  1.38it/s]   \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0919, UAS: 0.0972, LAS: 0.0205, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.0429, partial_loss/deprel_loss: 5.5430, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3323, loss: 11.3481, batch_reg_loss: 0.0893, reg_loss: 0.0958 ||:  61%|######1   | 68/111 [00:53<00:33,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0574, UAS: 0.1052, LAS: 0.0221, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.5849, partial_loss/deprel_loss: 6.9327, partial_loss/cycle_loss: 0.0000, batch_loss: 6.7516, loss: 11.1225, batch_reg_loss: 0.0885, reg_loss: 0.0954 ||:  65%|######4   | 72/111 [00:56<00:28,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0301, UAS: 0.1099, LAS: 0.0231, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.2882, partial_loss/deprel_loss: 9.4010, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4663, loss: 10.9824, batch_reg_loss: 0.0878, reg_loss: 0.0951 ||:  68%|######7   | 75/111 [01:00<00:33,  1.07it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0518, UAS: 0.1162, LAS: 0.0250, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.7446, partial_loss/deprel_loss: 8.7894, partial_loss/cycle_loss: 0.0000, batch_loss: 8.6676, loss: 10.8571, batch_reg_loss: 0.0872, reg_loss: 0.0948 ||:  70%|#######   | 78/111 [01:02<00:29,  1.13it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0834, UAS: 0.1219, LAS: 0.0265, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8250, partial_loss/deprel_loss: 7.3410, partial_loss/cycle_loss: 0.0000, batch_loss: 7.1244, loss: 10.7374, batch_reg_loss: 0.0866, reg_loss: 0.0945 ||:  73%|#######2  | 81/111 [01:04<00:24,  1.20it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0427, UAS: 0.1239, LAS: 0.0269, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 10.8399, partial_loss/deprel_loss: 10.0552, partial_loss/cycle_loss: 0.0000, batch_loss: 10.2981, loss: 10.7271, batch_reg_loss: 0.0860, reg_loss: 0.0942 ||:  76%|#######5  | 84/111 [01:07<00:22,  1.22it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0643, UAS: 0.1288, LAS: 0.0287, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.8981, partial_loss/deprel_loss: 9.3547, partial_loss/cycle_loss: 0.0000, batch_loss: 9.5488, loss: 10.6448, batch_reg_loss: 0.0854, reg_loss: 0.0939 ||:  78%|#######8  | 87/111 [01:09<00:19,  1.24it/s]   \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0661, UAS: 0.1356, LAS: 0.0319, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.0897, partial_loss/deprel_loss: 9.0732, partial_loss/cycle_loss: 0.0000, batch_loss: 9.1614, loss: 10.5082, batch_reg_loss: 0.0849, reg_loss: 0.0936 ||:  81%|########1 | 90/111 [01:12<00:17,  1.23it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0714, UAS: 0.1426, LAS: 0.0350, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.3305, partial_loss/deprel_loss: 8.5479, partial_loss/cycle_loss: 0.0000, batch_loss: 8.5886, loss: 10.3707, batch_reg_loss: 0.0842, reg_loss: 0.0932 ||:  85%|########4 | 94/111 [01:14<00:12,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0987, UAS: 0.1504, LAS: 0.0398, UEM: 0.0005, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8474, partial_loss/deprel_loss: 6.8979, partial_loss/cycle_loss: 0.0000, batch_loss: 6.7715, loss: 10.2165, batch_reg_loss: 0.0837, reg_loss: 0.0929 ||:  87%|########7 | 97/111 [01:17<00:10,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0733, UAS: 0.1541, LAS: 0.0412, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.9606, partial_loss/deprel_loss: 9.1819, partial_loss/cycle_loss: 0.0000, batch_loss: 9.4208, loss: 10.1551, batch_reg_loss: 0.0831, reg_loss: 0.0927 ||:  90%|######### | 100/111 [01:19<00:08,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0887, UAS: 0.1585, LAS: 0.0433, UEM: 0.0004, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.6073, partial_loss/deprel_loss: 8.5581, partial_loss/cycle_loss: 0.0000, batch_loss: 8.6506, loss: 10.0863, batch_reg_loss: 0.0826, reg_loss: 0.0924 ||:  93%|#########2| 103/111 [01:21<00:06,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0763, UAS: 0.1650, LAS: 0.0476, UEM: 0.0015, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.8387, partial_loss/deprel_loss: 8.8138, partial_loss/cycle_loss: 0.0000, batch_loss: 9.1009, loss: 9.9700, batch_reg_loss: 0.0821, reg_loss: 0.0921 ||:  95%|#########5| 106/111 [01:24<00:04,  1.15it/s] \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1713, UAS: 0.1692, LAS: 0.0496, UEM: 0.0014, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5725, partial_loss/deprel_loss: 5.1460, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1130, loss: 9.8781, batch_reg_loss: 0.0817, reg_loss: 0.0918 ||:  98%|#########8| 109/111 [01:27<00:01,  1.21it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1029, UAS: 0.1708, LAS: 0.0502, UEM: 0.0014, LEM: 0.0001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.0519, partial_loss/deprel_loss: 7.4492, partial_loss/cycle_loss: 0.0000, batch_loss: 7.4511, loss: 9.8521, batch_reg_loss: 0.0813, reg_loss: 0.0916 ||: 100%|##########| 111/111 [01:28<00:00,  1.25it/s]\n",
      "2023-04-06 22:51:15,927 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1167, UAS: 0.3116, LAS: 0.1456, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.9999, partial_loss/deprel_loss: 15.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 13.8275, loss: 12.0213, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:12,  1.11s/it]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2614, UAS: 0.3885, LAS: 0.1921, UEM: 0.0012, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.7361, partial_loss/deprel_loss: 8.9365, partial_loss/cycle_loss: 0.0000, batch_loss: 7.8964, loss: 10.3315, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  31%|###       | 4/13 [00:04<00:10,  1.15s/it]  \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1863, UAS: 0.3556, LAS: 0.1713, UEM: 0.0009, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.5918, partial_loss/deprel_loss: 8.8550, partial_loss/cycle_loss: 0.0000, batch_loss: 8.2024, loss: 11.6787, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:07<00:08,  1.17s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1274, UAS: 0.3363, LAS: 0.1580, UEM: 0.0008, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.5021, partial_loss/deprel_loss: 14.9977, partial_loss/cycle_loss: 0.0000, batch_loss: 13.4986, loss: 12.1599, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:09<00:05,  1.17s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0952, UAS: 0.3134, LAS: 0.1427, UEM: 0.0007, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.8305, partial_loss/deprel_loss: 17.7009, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9268, loss: 13.2406, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:12<00:03,  1.20s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3824, UAS: 0.3342, LAS: 0.1583, UEM: 0.0460, LEM: 0.0089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2575, partial_loss/deprel_loss: 6.4260, partial_loss/cycle_loss: 0.0000, batch_loss: 5.5923, loss: 12.9753, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:14<00:01,  1.20s/it]  \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1377, UAS: 0.3324, LAS: 0.1568, UEM: 0.0427, LEM: 0.0083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.7160, partial_loss/deprel_loss: 11.9092, partial_loss/cycle_loss: 0.0000, batch_loss: 10.8705, loss: 12.8134, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:15<00:00,  1.18s/it]\n",
      "2023-04-06 22:51:31,252 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     7.449  |    11.909\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     7.052  |     6.716\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.092  |     0.000\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - UEM                      |     0.001  |     0.043\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - LAS                      |     0.050  |     0.157\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - loss                     |     9.852  |    12.813\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  1397.911  |       N/A\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - LEM                      |     0.000  |     0.008\n",
      "2023-04-06 22:51:31,253 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - UAS                      |     0.171  |     0.332\n",
      "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - EM                       |     0.103  |     0.138\n",
      "2023-04-06 22:51:31,254 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  6486.516  |       N/A\n",
      "2023-04-06 22:51:31,254 - INFO - combo.training.trainer - Epoch duration: 0:01:43.946313\n",
      "2023-04-06 22:51:31,254 - INFO - combo.training.trainer - Estimated training time remaining: 11:31:14\n",
      "2023-04-06 22:51:31,254 - INFO - allennlp.training.trainer - Epoch 1/399\n",
      "2023-04-06 22:51:31,254 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 22:51:31,255 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 22:51:31,259 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5026, UAS: 0.5009, LAS: 0.2748, UEM: 0.3237, LEM: 0.0478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9612, partial_loss/deprel_loss: 2.2067, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0384, loss: 4.7510, batch_reg_loss: 0.0809, reg_loss: 0.0810 ||:   3%|2         | 3/111 [00:02<01:25,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2153, UAS: 0.4222, LAS: 0.2111, UEM: 0.2335, LEM: 0.0345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8553, partial_loss/deprel_loss: 5.3630, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1419, loss: 5.9501, batch_reg_loss: 0.0804, reg_loss: 0.0808 ||:   5%|5         | 6/111 [00:04<01:21,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1178, UAS: 0.3878, LAS: 0.1808, UEM: 0.1884, LEM: 0.0278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.1742, partial_loss/deprel_loss: 7.5720, partial_loss/cycle_loss: 0.0000, batch_loss: 7.5724, loss: 6.4967, batch_reg_loss: 0.0800, reg_loss: 0.0806 ||:   8%|8         | 9/111 [00:06<01:17,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1538, UAS: 0.3796, LAS: 0.1788, UEM: 0.1554, LEM: 0.0230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.8665, partial_loss/deprel_loss: 7.3143, partial_loss/cycle_loss: 0.0000, batch_loss: 7.3044, loss: 6.6142, batch_reg_loss: 0.0796, reg_loss: 0.0804 ||:  11%|#         | 12/111 [00:08<01:14,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3034, UAS: 0.3993, LAS: 0.1915, UEM: 0.1191, LEM: 0.0176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8777, partial_loss/deprel_loss: 4.3489, partial_loss/cycle_loss: 0.0000, batch_loss: 4.1338, loss: 6.2776, batch_reg_loss: 0.0791, reg_loss: 0.0801 ||:  14%|#3        | 15/111 [00:11<01:10,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.0891, UAS: 0.4053, LAS: 0.1952, UEM: 0.0993, LEM: 0.0147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 11.4397, partial_loss/deprel_loss: 9.1175, partial_loss/cycle_loss: 0.0000, batch_loss: 9.6606, loss: 6.2553, batch_reg_loss: 0.0787, reg_loss: 0.0799 ||:  16%|#6        | 18/111 [00:13<01:07,  1.38it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1735, UAS: 0.3983, LAS: 0.1911, UEM: 0.0899, LEM: 0.0133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8049, partial_loss/deprel_loss: 6.6946, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5950, loss: 6.3528, batch_reg_loss: 0.0783, reg_loss: 0.0797 ||:  19%|#8        | 21/111 [00:15<01:03,  1.41it/s] \n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2083, UAS: 0.3981, LAS: 0.1902, UEM: 0.0799, LEM: 0.0118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.1757, partial_loss/deprel_loss: 6.1916, partial_loss/cycle_loss: 0.0000, batch_loss: 6.0662, loss: 6.4057, batch_reg_loss: 0.0778, reg_loss: 0.0794 ||:  23%|##2       | 25/111 [00:17<00:58,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2246, UAS: 0.4012, LAS: 0.1929, UEM: 0.0725, LEM: 0.0107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.8645, partial_loss/deprel_loss: 6.6577, partial_loss/cycle_loss: 0.0000, batch_loss: 6.5763, loss: 6.4495, batch_reg_loss: 0.0772, reg_loss: 0.0792 ||:  26%|##6       | 29/111 [00:19<00:53,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2794, UAS: 0.4082, LAS: 0.1982, UEM: 0.0672, LEM: 0.0099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.1211, partial_loss/deprel_loss: 5.4412, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2540, loss: 6.4181, batch_reg_loss: 0.0768, reg_loss: 0.0790 ||:  29%|##8       | 32/111 [00:22<00:52,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4732, UAS: 0.4244, LAS: 0.2122, UEM: 0.0709, LEM: 0.0090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3779, partial_loss/deprel_loss: 2.8672, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6458, loss: 6.2343, batch_reg_loss: 0.0764, reg_loss: 0.0787 ||:  32%|###1      | 35/111 [00:24<00:51,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3141, UAS: 0.4378, LAS: 0.2248, UEM: 0.0649, LEM: 0.0081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.3674, partial_loss/deprel_loss: 5.2037, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1125, loss: 6.0777, batch_reg_loss: 0.0761, reg_loss: 0.0785 ||:  34%|###4      | 38/111 [00:26<00:49,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2198, UAS: 0.4458, LAS: 0.2334, UEM: 0.0596, LEM: 0.0074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 7.4857, partial_loss/deprel_loss: 7.1532, partial_loss/cycle_loss: 0.0000, batch_loss: 7.2953, loss: 6.0151, batch_reg_loss: 0.0756, reg_loss: 0.0783 ||:  38%|###7      | 42/111 [00:28<00:44,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.1855, UAS: 0.4456, LAS: 0.2364, UEM: 0.0564, LEM: 0.0070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 9.3300, partial_loss/deprel_loss: 7.6093, partial_loss/cycle_loss: 0.0000, batch_loss: 8.0285, loss: 6.0670, batch_reg_loss: 0.0751, reg_loss: 0.0780 ||:  41%|####1     | 46/111 [00:31<00:41,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3267, UAS: 0.4538, LAS: 0.2458, UEM: 0.0542, LEM: 0.0064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.7855, partial_loss/deprel_loss: 5.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3551, loss: 5.9627, batch_reg_loss: 0.0747, reg_loss: 0.0778 ||:  45%|####5     | 50/111 [00:33<00:40,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.2382, UAS: 0.4571, LAS: 0.2516, UEM: 0.0580, LEM: 0.0061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 8.0241, partial_loss/deprel_loss: 6.9911, partial_loss/cycle_loss: 0.0000, batch_loss: 7.2719, loss: 5.9374, batch_reg_loss: 0.0743, reg_loss: 0.0775 ||:  49%|####8     | 54/111 [00:36<00:38,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3417, UAS: 0.4640, LAS: 0.2595, UEM: 0.0551, LEM: 0.0057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.8885, partial_loss/deprel_loss: 5.4813, partial_loss/cycle_loss: 0.0000, batch_loss: 5.4367, loss: 5.8601, batch_reg_loss: 0.0740, reg_loss: 0.0773 ||:  51%|#####1    | 57/111 [00:38<00:37,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5159, UAS: 0.4709, LAS: 0.2672, UEM: 0.0535, LEM: 0.0055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9516, partial_loss/deprel_loss: 3.0269, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8855, loss: 5.7894, batch_reg_loss: 0.0737, reg_loss: 0.0772 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3337, UAS: 0.4761, LAS: 0.2741, UEM: 0.0511, LEM: 0.0052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.5468, partial_loss/deprel_loss: 5.5245, partial_loss/cycle_loss: 0.0000, batch_loss: 5.6022, loss: 5.7441, batch_reg_loss: 0.0733, reg_loss: 0.0769 ||:  58%|#####7    | 64/111 [00:43<00:32,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4904, UAS: 0.4849, LAS: 0.2834, UEM: 0.0531, LEM: 0.0049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4105, partial_loss/deprel_loss: 3.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 3.2892, loss: 5.6526, batch_reg_loss: 0.0730, reg_loss: 0.0768 ||:  60%|######    | 67/111 [00:45<00:29,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4030, UAS: 0.4920, LAS: 0.2912, UEM: 0.0521, LEM: 0.0047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4853, partial_loss/deprel_loss: 4.8174, partial_loss/cycle_loss: 0.0000, batch_loss: 4.8237, loss: 5.5778, batch_reg_loss: 0.0727, reg_loss: 0.0766 ||:  63%|######3   | 70/111 [00:47<00:28,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5730, UAS: 0.4957, LAS: 0.2965, UEM: 0.0518, LEM: 0.0046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8525, partial_loss/deprel_loss: 2.9431, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7975, loss: 5.5408, batch_reg_loss: 0.0724, reg_loss: 0.0764 ||:  66%|######5   | 73/111 [00:50<00:26,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6026, UAS: 0.5030, LAS: 0.3044, UEM: 0.0582, LEM: 0.0055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2230, partial_loss/deprel_loss: 2.2791, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1400, loss: 5.4648, batch_reg_loss: 0.0722, reg_loss: 0.0763 ||:  68%|######8   | 76/111 [00:52<00:24,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5257, UAS: 0.5093, LAS: 0.3114, UEM: 0.0590, LEM: 0.0055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3376, partial_loss/deprel_loss: 3.2408, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1320, loss: 5.3956, batch_reg_loss: 0.0719, reg_loss: 0.0761 ||:  71%|#######1  | 79/111 [00:54<00:22,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4749, UAS: 0.5194, LAS: 0.3224, UEM: 0.0594, LEM: 0.0054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.3244, partial_loss/deprel_loss: 4.0444, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9720, loss: 5.2892, batch_reg_loss: 0.0716, reg_loss: 0.0759 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3801, UAS: 0.5250, LAS: 0.3287, UEM: 0.0793, LEM: 0.0098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.3332, partial_loss/deprel_loss: 5.2213, partial_loss/cycle_loss: 0.0000, batch_loss: 5.3150, loss: 5.2322, batch_reg_loss: 0.0713, reg_loss: 0.0757 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6195, UAS: 0.5311, LAS: 0.3359, UEM: 0.0901, LEM: 0.0120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5655, partial_loss/deprel_loss: 2.5718, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4416, loss: 5.1692, batch_reg_loss: 0.0711, reg_loss: 0.0756 ||:  80%|########  | 89/111 [01:01<00:15,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.3892, UAS: 0.5363, LAS: 0.3422, UEM: 0.0929, LEM: 0.0126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.3758, partial_loss/deprel_loss: 4.9502, partial_loss/cycle_loss: 0.0000, batch_loss: 5.1062, loss: 5.1101, batch_reg_loss: 0.0708, reg_loss: 0.0754 ||:  83%|########2 | 92/111 [01:03<00:14,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4308, UAS: 0.5397, LAS: 0.3464, UEM: 0.0947, LEM: 0.0126, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4937, partial_loss/deprel_loss: 4.5762, partial_loss/cycle_loss: 0.0000, batch_loss: 4.6303, loss: 5.0772, batch_reg_loss: 0.0706, reg_loss: 0.0753 ||:  86%|########5 | 95/111 [01:05<00:12,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4948, UAS: 0.5455, LAS: 0.3534, UEM: 0.0926, LEM: 0.0121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4684, partial_loss/deprel_loss: 3.7837, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7909, loss: 5.0118, batch_reg_loss: 0.0703, reg_loss: 0.0751 ||:  89%|########9 | 99/111 [01:08<00:08,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5697, UAS: 0.5519, LAS: 0.3608, UEM: 0.0901, LEM: 0.0116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5438, partial_loss/deprel_loss: 3.1081, partial_loss/cycle_loss: 0.0000, batch_loss: 3.0652, loss: 4.9450, batch_reg_loss: 0.0700, reg_loss: 0.0749 ||:  93%|#########2| 103/111 [01:11<00:05,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4417, UAS: 0.5557, LAS: 0.3658, UEM: 0.0879, LEM: 0.0113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.9554, partial_loss/deprel_loss: 4.7208, partial_loss/cycle_loss: 0.0000, batch_loss: 4.8375, loss: 4.9064, batch_reg_loss: 0.0697, reg_loss: 0.0747 ||:  96%|#########6| 107/111 [01:13<00:02,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4557, UAS: 0.5579, LAS: 0.3695, UEM: 0.0862, LEM: 0.0111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5091, partial_loss/deprel_loss: 4.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 4.5886, loss: 4.8903, batch_reg_loss: 0.0695, reg_loss: 0.0745 ||: 100%|##########| 111/111 [01:16<00:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4557, UAS: 0.5579, LAS: 0.3695, UEM: 0.0862, LEM: 0.0111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.5091, partial_loss/deprel_loss: 4.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 4.5886, loss: 4.8903, batch_reg_loss: 0.0695, reg_loss: 0.0745 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 22:52:47,522 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     4.522  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     4.509  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.075  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - UEM                      |     0.086  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - LAS                      |     0.369  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - loss                     |     4.890  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - LEM                      |     0.011  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - UAS                      |     0.558  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - EM                       |     0.456  |       N/A\n",
      "2023-04-06 22:52:47,523 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 22:52:47,524 - INFO - combo.training.trainer - Epoch duration: 0:01:16.269599\n",
      "2023-04-06 22:52:47,524 - INFO - combo.training.trainer - Estimated training time remaining: 9:57:43\n",
      "2023-04-06 22:52:47,524 - INFO - allennlp.training.trainer - Epoch 2/399\n",
      "2023-04-06 22:52:47,524 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 22:52:47,525 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 22:52:47,531 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4964, UAS: 0.6204, LAS: 0.4727, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5829, partial_loss/deprel_loss: 3.9397, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9376, loss: 4.4478, batch_reg_loss: 0.0693, reg_loss: 0.0693 ||:   3%|2         | 3/111 [00:02<01:15,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6479, UAS: 0.6977, LAS: 0.5419, UEM: 0.1026, LEM: 0.0106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4297, partial_loss/deprel_loss: 2.4040, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2782, loss: 3.5690, batch_reg_loss: 0.0691, reg_loss: 0.0692 ||:   5%|5         | 6/111 [00:04<01:13,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4715, UAS: 0.6718, LAS: 0.5218, UEM: 0.0755, LEM: 0.0079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.3314, partial_loss/deprel_loss: 4.2643, partial_loss/cycle_loss: 0.0000, batch_loss: 4.3466, loss: 3.8142, batch_reg_loss: 0.0688, reg_loss: 0.0691 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6659, UAS: 0.6858, LAS: 0.5350, UEM: 0.0982, LEM: 0.0139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2351, partial_loss/deprel_loss: 2.0560, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9605, loss: 3.6185, batch_reg_loss: 0.0687, reg_loss: 0.0690 ||:  12%|#1        | 13/111 [00:09<01:10,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4735, UAS: 0.6843, LAS: 0.5326, UEM: 0.0795, LEM: 0.0112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.1403, partial_loss/deprel_loss: 4.2142, partial_loss/cycle_loss: 0.0000, batch_loss: 4.2679, loss: 3.6370, batch_reg_loss: 0.0685, reg_loss: 0.0689 ||:  15%|#5        | 17/111 [00:11<01:04,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6194, UAS: 0.6898, LAS: 0.5366, UEM: 0.0818, LEM: 0.0096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6949, partial_loss/deprel_loss: 2.5650, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4592, loss: 3.5757, batch_reg_loss: 0.0683, reg_loss: 0.0688 ||:  19%|#8        | 21/111 [00:14<01:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8213, UAS: 0.6979, LAS: 0.5455, UEM: 0.2170, LEM: 0.0958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2964, partial_loss/deprel_loss: 0.8507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8079, loss: 3.5040, batch_reg_loss: 0.0681, reg_loss: 0.0687 ||:  23%|##2       | 25/111 [00:17<01:00,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5476, UAS: 0.7039, LAS: 0.5509, UEM: 0.1942, LEM: 0.0844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0957, partial_loss/deprel_loss: 3.5291, partial_loss/cycle_loss: 0.0000, batch_loss: 3.5103, loss: 3.4550, batch_reg_loss: 0.0679, reg_loss: 0.0686 ||:  26%|##6       | 29/111 [00:19<00:55,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4213, UAS: 0.7068, LAS: 0.5547, UEM: 0.2095, LEM: 0.0826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 6.1965, partial_loss/deprel_loss: 4.9298, partial_loss/cycle_loss: 0.0000, batch_loss: 5.2509, loss: 3.4173, batch_reg_loss: 0.0677, reg_loss: 0.0685 ||:  29%|##8       | 32/111 [00:21<00:54,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4924, UAS: 0.7115, LAS: 0.5588, UEM: 0.1968, LEM: 0.0746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.2653, partial_loss/deprel_loss: 4.2745, partial_loss/cycle_loss: 0.0000, batch_loss: 4.3402, loss: 3.3855, batch_reg_loss: 0.0675, reg_loss: 0.0684 ||:  32%|###2      | 36/111 [00:24<00:49,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.4861, UAS: 0.7136, LAS: 0.5609, UEM: 0.1834, LEM: 0.0689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.9229, partial_loss/deprel_loss: 4.5551, partial_loss/cycle_loss: 0.0000, batch_loss: 4.6960, loss: 3.3816, batch_reg_loss: 0.0673, reg_loss: 0.0683 ||:  36%|###6      | 40/111 [00:26<00:45,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5632, UAS: 0.7197, LAS: 0.5670, UEM: 0.2184, LEM: 0.0784, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7730, partial_loss/deprel_loss: 3.3519, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3032, loss: 3.3144, batch_reg_loss: 0.0672, reg_loss: 0.0682 ||:  40%|###9      | 44/111 [00:29<00:43,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6700, UAS: 0.7271, LAS: 0.5743, UEM: 0.2131, LEM: 0.0736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5173, partial_loss/deprel_loss: 2.2309, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1552, loss: 3.2352, batch_reg_loss: 0.0670, reg_loss: 0.0681 ||:  43%|####3     | 48/111 [00:32<00:42,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6822, UAS: 0.7298, LAS: 0.5776, UEM: 0.2081, LEM: 0.0692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4613, partial_loss/deprel_loss: 2.0556, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0036, loss: 3.1978, batch_reg_loss: 0.0668, reg_loss: 0.0680 ||:  47%|####6     | 52/111 [00:34<00:38,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5462, UAS: 0.7286, LAS: 0.5768, UEM: 0.2001, LEM: 0.0662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8922, partial_loss/deprel_loss: 3.8440, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9202, loss: 3.2158, batch_reg_loss: 0.0666, reg_loss: 0.0679 ||:  50%|#####     | 56/111 [00:37<00:34,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6350, UAS: 0.7299, LAS: 0.5784, UEM: 0.1921, LEM: 0.0628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9702, partial_loss/deprel_loss: 2.6377, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5707, loss: 3.2028, batch_reg_loss: 0.0665, reg_loss: 0.0678 ||:  54%|#####4    | 60/111 [00:39<00:31,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5091, UAS: 0.7325, LAS: 0.5817, UEM: 0.2037, LEM: 0.0652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4303, partial_loss/deprel_loss: 4.1332, partial_loss/cycle_loss: 0.0000, batch_loss: 4.2589, loss: 3.1722, batch_reg_loss: 0.0663, reg_loss: 0.0677 ||:  58%|#####7    | 64/111 [00:42<00:29,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7077, UAS: 0.7373, LAS: 0.5864, UEM: 0.2098, LEM: 0.0632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8847, partial_loss/deprel_loss: 1.6877, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5933, loss: 3.1156, batch_reg_loss: 0.0661, reg_loss: 0.0677 ||:  61%|######1   | 68/111 [00:45<00:28,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6647, UAS: 0.7394, LAS: 0.5886, UEM: 0.2110, LEM: 0.0610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6878, partial_loss/deprel_loss: 2.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2747, loss: 3.0945, batch_reg_loss: 0.0660, reg_loss: 0.0676 ||:  65%|######4   | 72/111 [00:47<00:26,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7484, UAS: 0.7455, LAS: 0.5957, UEM: 0.2179, LEM: 0.0604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9192, partial_loss/deprel_loss: 1.6239, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5488, loss: 3.0243, batch_reg_loss: 0.0658, reg_loss: 0.0675 ||:  68%|######8   | 76/111 [00:50<00:22,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6129, UAS: 0.7469, LAS: 0.5972, UEM: 0.2108, LEM: 0.0580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4237, partial_loss/deprel_loss: 2.8786, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8533, loss: 3.0067, batch_reg_loss: 0.0657, reg_loss: 0.0674 ||:  72%|#######2  | 80/111 [00:52<00:20,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6110, UAS: 0.7481, LAS: 0.5991, UEM: 0.2070, LEM: 0.0563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7020, partial_loss/deprel_loss: 2.9102, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9341, loss: 2.9940, batch_reg_loss: 0.0655, reg_loss: 0.0673 ||:  76%|#######5  | 84/111 [00:55<00:17,  1.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6596, UAS: 0.7500, LAS: 0.6014, UEM: 0.2146, LEM: 0.0583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7501, partial_loss/deprel_loss: 2.3329, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2817, loss: 2.9726, batch_reg_loss: 0.0654, reg_loss: 0.0672 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6643, UAS: 0.7513, LAS: 0.6027, UEM: 0.2091, LEM: 0.0562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8068, partial_loss/deprel_loss: 2.3690, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3218, loss: 2.9569, batch_reg_loss: 0.0652, reg_loss: 0.0671 ||:  83%|########2 | 92/111 [01:00<00:12,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6382, UAS: 0.7496, LAS: 0.6019, UEM: 0.2044, LEM: 0.0549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3354, partial_loss/deprel_loss: 2.7962, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7691, loss: 2.9764, batch_reg_loss: 0.0651, reg_loss: 0.0670 ||:  86%|########6 | 96/111 [01:03<00:09,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6473, UAS: 0.7524, LAS: 0.6053, UEM: 0.2124, LEM: 0.0594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9798, partial_loss/deprel_loss: 2.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4257, loss: 2.9392, batch_reg_loss: 0.0650, reg_loss: 0.0670 ||:  90%|######### | 100/111 [01:06<00:07,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7644, UAS: 0.7557, LAS: 0.6091, UEM: 0.2193, LEM: 0.0602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7733, partial_loss/deprel_loss: 1.3687, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3145, loss: 2.9018, batch_reg_loss: 0.0649, reg_loss: 0.0669 ||:  93%|#########2| 103/111 [01:08<00:05,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7474, UAS: 0.7586, LAS: 0.6125, UEM: 0.2241, LEM: 0.0607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8481, partial_loss/deprel_loss: 1.5531, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4769, loss: 2.8675, batch_reg_loss: 0.0648, reg_loss: 0.0668 ||:  95%|#########5| 106/111 [01:10<00:03,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6552, UAS: 0.7581, LAS: 0.6123, UEM: 0.2194, LEM: 0.0593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0818, partial_loss/deprel_loss: 2.4685, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4559, loss: 2.8710, batch_reg_loss: 0.0647, reg_loss: 0.0668 ||:  99%|#########9| 110/111 [01:13<00:00,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7474, UAS: 0.7592, LAS: 0.6135, UEM: 0.2213, LEM: 0.0596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8614, partial_loss/deprel_loss: 1.4801, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4210, loss: 2.8579, batch_reg_loss: 0.0646, reg_loss: 0.0668 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 22:54:01,487 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.480  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.861  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.067  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - UEM                      |     0.221  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - LAS                      |     0.614  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - loss                     |     2.858  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - LEM                      |     0.060  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - UAS                      |     0.759  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - EM                       |     0.747  |       N/A\n",
      "2023-04-06 22:54:01,488 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 22:54:01,489 - INFO - combo.training.trainer - Epoch duration: 0:01:13.964691\n",
      "2023-04-06 22:54:01,489 - INFO - combo.training.trainer - Estimated training time remaining: 9:20:36\n",
      "2023-04-06 22:54:01,489 - INFO - allennlp.training.trainer - Epoch 3/399\n",
      "2023-04-06 22:54:01,489 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 22:54:01,490 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 22:54:01,496 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5522, UAS: 0.7779, LAS: 0.6461, UEM: 0.4911, LEM: 0.1886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8721, partial_loss/deprel_loss: 3.5902, partial_loss/cycle_loss: 0.0000, batch_loss: 3.7111, loss: 2.6501, batch_reg_loss: 0.0646, reg_loss: 0.0646 ||:   3%|2         | 3/111 [00:02<01:18,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5244, UAS: 0.7464, LAS: 0.6105, UEM: 0.3157, LEM: 0.1195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.4001, partial_loss/deprel_loss: 3.7685, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9592, loss: 2.9957, batch_reg_loss: 0.0644, reg_loss: 0.0645 ||:   6%|6         | 7/111 [00:04<01:12,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7839, UAS: 0.7827, LAS: 0.6504, UEM: 0.3397, LEM: 0.1092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6771, partial_loss/deprel_loss: 1.2152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1719, loss: 2.5749, batch_reg_loss: 0.0644, reg_loss: 0.0645 ||:   9%|9         | 10/111 [00:07<01:15,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5962, UAS: 0.7864, LAS: 0.6557, UEM: 0.2923, LEM: 0.0888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.4499, partial_loss/deprel_loss: 3.2404, partial_loss/cycle_loss: 0.0000, batch_loss: 3.3466, loss: 2.5323, batch_reg_loss: 0.0643, reg_loss: 0.0644 ||:  12%|#1        | 13/111 [00:09<01:15,  1.30it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7262, UAS: 0.7947, LAS: 0.6646, UEM: 0.2585, LEM: 0.0737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3265, partial_loss/deprel_loss: 2.0057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9340, loss: 2.4410, batch_reg_loss: 0.0642, reg_loss: 0.0644 ||:  14%|#4        | 16/111 [00:11<01:10,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7504, UAS: 0.7977, LAS: 0.6674, UEM: 0.2444, LEM: 0.0644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9908, partial_loss/deprel_loss: 1.5113, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4713, loss: 2.4127, batch_reg_loss: 0.0641, reg_loss: 0.0644 ||:  18%|#8        | 20/111 [00:14<01:04,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7616, UAS: 0.8064, LAS: 0.6763, UEM: 0.2720, LEM: 0.0723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6766, partial_loss/deprel_loss: 1.3444, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2749, loss: 2.3152, batch_reg_loss: 0.0640, reg_loss: 0.0643 ||:  22%|##1       | 24/111 [00:17<01:01,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7372, UAS: 0.8092, LAS: 0.6787, UEM: 0.2590, LEM: 0.0651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9644, partial_loss/deprel_loss: 1.6293, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5602, loss: 2.2885, batch_reg_loss: 0.0639, reg_loss: 0.0643 ||:  25%|##5       | 28/111 [00:19<00:56,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6937, UAS: 0.8106, LAS: 0.6800, UEM: 0.2438, LEM: 0.0602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7709, partial_loss/deprel_loss: 2.3077, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2642, loss: 2.2836, batch_reg_loss: 0.0638, reg_loss: 0.0642 ||:  28%|##7       | 31/111 [00:21<00:54,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6296, UAS: 0.8098, LAS: 0.6796, UEM: 0.2471, LEM: 0.0589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8165, partial_loss/deprel_loss: 2.8907, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9396, loss: 2.2935, batch_reg_loss: 0.0637, reg_loss: 0.0642 ||:  31%|###       | 34/111 [00:23<00:52,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7206, UAS: 0.8103, LAS: 0.6805, UEM: 0.2360, LEM: 0.0556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4751, partial_loss/deprel_loss: 1.8719, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8562, loss: 2.2865, batch_reg_loss: 0.0637, reg_loss: 0.0641 ||:  33%|###3      | 37/111 [00:25<00:50,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7730, UAS: 0.8120, LAS: 0.6830, UEM: 0.2357, LEM: 0.0549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7538, partial_loss/deprel_loss: 1.3218, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2718, loss: 2.2638, batch_reg_loss: 0.0636, reg_loss: 0.0641 ||:  37%|###6      | 41/111 [00:28<00:48,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7604, UAS: 0.8162, LAS: 0.6880, UEM: 0.2428, LEM: 0.0550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9503, partial_loss/deprel_loss: 1.5284, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4763, loss: 2.2114, batch_reg_loss: 0.0635, reg_loss: 0.0640 ||:  40%|###9      | 44/111 [00:31<00:48,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6857, UAS: 0.8111, LAS: 0.6833, UEM: 0.2349, LEM: 0.0532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9399, partial_loss/deprel_loss: 2.2534, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2541, loss: 2.2633, batch_reg_loss: 0.0634, reg_loss: 0.0640 ||:  42%|####2     | 47/111 [00:33<00:45,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5934, UAS: 0.8120, LAS: 0.6844, UEM: 0.2419, LEM: 0.0557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2585, partial_loss/deprel_loss: 3.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 3.4829, loss: 2.2516, batch_reg_loss: 0.0634, reg_loss: 0.0640 ||:  45%|####5     | 50/111 [00:35<00:43,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7835, UAS: 0.8132, LAS: 0.6859, UEM: 0.2388, LEM: 0.0539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8033, partial_loss/deprel_loss: 1.3395, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2956, loss: 2.2403, batch_reg_loss: 0.0633, reg_loss: 0.0639 ||:  49%|####8     | 54/111 [00:37<00:39,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6621, UAS: 0.8141, LAS: 0.6874, UEM: 0.2512, LEM: 0.0626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2108, partial_loss/deprel_loss: 2.3082, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3519, loss: 2.2189, batch_reg_loss: 0.0632, reg_loss: 0.0639 ||:  51%|#####1    | 57/111 [00:40<00:38,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7630, UAS: 0.8126, LAS: 0.6865, UEM: 0.2518, LEM: 0.0619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7939, partial_loss/deprel_loss: 1.3554, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3063, loss: 2.2319, batch_reg_loss: 0.0631, reg_loss: 0.0638 ||:  55%|#####4    | 61/111 [00:42<00:34,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6531, UAS: 0.8133, LAS: 0.6870, UEM: 0.2467, LEM: 0.0600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5764, partial_loss/deprel_loss: 2.7017, partial_loss/cycle_loss: 0.0000, batch_loss: 2.7397, loss: 2.2260, batch_reg_loss: 0.0631, reg_loss: 0.0638 ||:  58%|#####7    | 64/111 [00:44<00:32,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7632, UAS: 0.8168, LAS: 0.6906, UEM: 0.2563, LEM: 0.0609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0152, partial_loss/deprel_loss: 1.4983, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4647, loss: 2.1896, batch_reg_loss: 0.0630, reg_loss: 0.0638 ||:  60%|######    | 67/111 [00:46<00:31,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7593, UAS: 0.8180, LAS: 0.6922, UEM: 0.2522, LEM: 0.0592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0271, partial_loss/deprel_loss: 1.5328, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4947, loss: 2.1787, batch_reg_loss: 0.0630, reg_loss: 0.0637 ||:  63%|######3   | 70/111 [00:49<00:29,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.8196, LAS: 0.6948, UEM: 0.2829, LEM: 0.0893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2393, partial_loss/deprel_loss: 0.5426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5448, loss: 2.1589, batch_reg_loss: 0.0629, reg_loss: 0.0637 ||:  67%|######6   | 74/111 [00:52<00:27,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6841, UAS: 0.8216, LAS: 0.6972, UEM: 0.2908, LEM: 0.0913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9630, partial_loss/deprel_loss: 2.3586, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3423, loss: 2.1351, batch_reg_loss: 0.0628, reg_loss: 0.0637 ||:  69%|######9   | 77/111 [00:54<00:25,  1.32it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7229, UAS: 0.8176, LAS: 0.6935, UEM: 0.2843, LEM: 0.0890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5630, partial_loss/deprel_loss: 1.9479, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9337, loss: 2.1812, batch_reg_loss: 0.0628, reg_loss: 0.0636 ||:  73%|#######2  | 81/111 [00:57<00:21,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7388, UAS: 0.8182, LAS: 0.6943, UEM: 0.2795, LEM: 0.0866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1689, partial_loss/deprel_loss: 1.7263, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6775, loss: 2.1734, batch_reg_loss: 0.0627, reg_loss: 0.0636 ||:  77%|#######6  | 85/111 [00:59<00:17,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7027, UAS: 0.8202, LAS: 0.6969, UEM: 0.2926, LEM: 0.0965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7537, partial_loss/deprel_loss: 2.1230, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1117, loss: 2.1483, batch_reg_loss: 0.0626, reg_loss: 0.0635 ||:  80%|########  | 89/111 [01:02<00:14,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7744, UAS: 0.8185, LAS: 0.6957, UEM: 0.2882, LEM: 0.0944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0477, partial_loss/deprel_loss: 1.4812, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4571, loss: 2.1638, batch_reg_loss: 0.0626, reg_loss: 0.0635 ||:  84%|########3 | 93/111 [01:04<00:11,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8176, UAS: 0.8203, LAS: 0.6977, UEM: 0.2968, LEM: 0.0975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4458, partial_loss/deprel_loss: 0.9504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9120, loss: 2.1448, batch_reg_loss: 0.0625, reg_loss: 0.0635 ||:  87%|########7 | 97/111 [01:07<00:09,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6879, UAS: 0.8175, LAS: 0.6950, UEM: 0.2918, LEM: 0.0958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0558, partial_loss/deprel_loss: 2.3149, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3255, loss: 2.1791, batch_reg_loss: 0.0624, reg_loss: 0.0634 ||:  91%|######### | 101/111 [01:10<00:06,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7525, UAS: 0.8183, LAS: 0.6962, UEM: 0.2889, LEM: 0.0938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1692, partial_loss/deprel_loss: 1.6748, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6361, loss: 2.1703, batch_reg_loss: 0.0624, reg_loss: 0.0634 ||:  95%|#########4| 105/111 [01:13<00:04,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6415, UAS: 0.8200, LAS: 0.6981, UEM: 0.2967, LEM: 0.0958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.9598, partial_loss/deprel_loss: 2.7343, partial_loss/cycle_loss: 0.0000, batch_loss: 2.8417, loss: 2.1535, batch_reg_loss: 0.0623, reg_loss: 0.0633 ||:  98%|#########8| 109/111 [01:15<00:01,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6768, UAS: 0.8197, LAS: 0.6979, UEM: 0.2936, LEM: 0.0948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2748, partial_loss/deprel_loss: 2.3791, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4206, loss: 2.1574, batch_reg_loss: 0.0623, reg_loss: 0.0633 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-06 22:55:18,227 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 22:55:18,227 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     2.379  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     2.275  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.063  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - UEM                      |     0.294  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - LAS                      |     0.698  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - loss                     |     2.157  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - LEM                      |     0.095  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 22:55:18,228 - INFO - combo.training.tensorboard_writer - UAS                      |     0.820  |       N/A\n",
      "2023-04-06 22:55:18,229 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 22:55:18,229 - INFO - combo.training.tensorboard_writer - EM                       |     0.677  |       N/A\n",
      "2023-04-06 22:55:18,229 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 22:55:18,229 - INFO - combo.training.trainer - Epoch duration: 0:01:16.740242\n",
      "2023-04-06 22:55:18,229 - INFO - combo.training.trainer - Estimated training time remaining: 9:06:01\n",
      "2023-04-06 22:55:18,230 - INFO - allennlp.training.trainer - Epoch 4/399\n",
      "2023-04-06 22:55:18,230 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 22:55:18,230 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 22:55:18,236 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6673, UAS: 0.7876, LAS: 0.6728, UEM: 0.0000, LEM: 0.0000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6651, partial_loss/deprel_loss: 2.6082, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6819, loss: 2.5358, batch_reg_loss: 0.0623, reg_loss: 0.0623 ||:   3%|2         | 3/111 [00:02<01:16,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.5590, UAS: 0.7847, LAS: 0.6734, UEM: 0.0866, LEM: 0.0162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 5.1240, partial_loss/deprel_loss: 3.5891, partial_loss/cycle_loss: 0.0000, batch_loss: 3.9583, loss: 2.5349, batch_reg_loss: 0.0623, reg_loss: 0.0623 ||:   5%|5         | 6/111 [00:04<01:14,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8070, UAS: 0.8104, LAS: 0.7009, UEM: 0.1961, LEM: 0.0497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6716, partial_loss/deprel_loss: 1.1607, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1251, loss: 2.2299, batch_reg_loss: 0.0622, reg_loss: 0.0623 ||:   8%|8         | 9/111 [00:06<01:13,  1.38it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6524, UAS: 0.8224, LAS: 0.7121, UEM: 0.2315, LEM: 0.0565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7101, partial_loss/deprel_loss: 2.5980, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6826, loss: 2.1006, batch_reg_loss: 0.0622, reg_loss: 0.0622 ||:  12%|#1        | 13/111 [00:09<01:08,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8191, UAS: 0.8348, LAS: 0.7248, UEM: 0.3040, LEM: 0.0847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6051, partial_loss/deprel_loss: 1.1280, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0855, loss: 1.9659, batch_reg_loss: 0.0621, reg_loss: 0.0622 ||:  14%|#4        | 16/111 [00:11<01:08,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7504, UAS: 0.8448, LAS: 0.7351, UEM: 0.3447, LEM: 0.0959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1769, partial_loss/deprel_loss: 1.5892, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5688, loss: 1.8513, batch_reg_loss: 0.0621, reg_loss: 0.0622 ||:  17%|#7        | 19/111 [00:13<01:08,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6802, UAS: 0.8436, LAS: 0.7338, UEM: 0.3206, LEM: 0.0886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3447, partial_loss/deprel_loss: 2.3007, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3715, loss: 1.8468, batch_reg_loss: 0.0620, reg_loss: 0.0622 ||:  21%|##        | 23/111 [00:16<01:02,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6018, UAS: 0.8382, LAS: 0.7278, UEM: 0.2957, LEM: 0.0798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.6370, partial_loss/deprel_loss: 2.9539, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1524, loss: 1.9081, batch_reg_loss: 0.0620, reg_loss: 0.0621 ||:  24%|##4       | 27/111 [00:18<00:56,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8199, UAS: 0.8419, LAS: 0.7321, UEM: 0.3047, LEM: 0.0860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6244, partial_loss/deprel_loss: 1.0798, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0506, loss: 1.8696, batch_reg_loss: 0.0619, reg_loss: 0.0621 ||:  28%|##7       | 31/111 [00:21<00:53,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6994, UAS: 0.8443, LAS: 0.7347, UEM: 0.3040, LEM: 0.0849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3267, partial_loss/deprel_loss: 2.3726, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4253, loss: 1.8526, batch_reg_loss: 0.0619, reg_loss: 0.0621 ||:  31%|###       | 34/111 [00:23<00:52,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8111, UAS: 0.8474, LAS: 0.7388, UEM: 0.3153, LEM: 0.0885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5854, partial_loss/deprel_loss: 1.0084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9856, loss: 1.8095, batch_reg_loss: 0.0618, reg_loss: 0.0621 ||:  33%|###3      | 37/111 [00:26<00:54,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7707, UAS: 0.8458, LAS: 0.7371, UEM: 0.3159, LEM: 0.0895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1063, partial_loss/deprel_loss: 1.5260, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5038, loss: 1.8230, batch_reg_loss: 0.0618, reg_loss: 0.0620 ||:  37%|###6      | 41/111 [00:28<00:49,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6812, UAS: 0.8369, LAS: 0.7281, UEM: 0.3046, LEM: 0.0863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4355, partial_loss/deprel_loss: 2.4780, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5312, loss: 1.9258, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||:  41%|####      | 45/111 [00:31<00:44,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7159, UAS: 0.8362, LAS: 0.7273, UEM: 0.2977, LEM: 0.0830, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6377, partial_loss/deprel_loss: 2.1209, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0860, loss: 1.9371, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||:  43%|####3     | 48/111 [00:33<00:44,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7413, UAS: 0.8332, LAS: 0.7243, UEM: 0.2893, LEM: 0.0804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3635, partial_loss/deprel_loss: 1.7896, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7661, loss: 1.9680, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||:  46%|####5     | 51/111 [00:35<00:43,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7546, UAS: 0.8368, LAS: 0.7289, UEM: 0.3044, LEM: 0.0903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4638, partial_loss/deprel_loss: 1.6606, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6829, loss: 1.9241, batch_reg_loss: 0.0617, reg_loss: 0.0620 ||:  50%|####9     | 55/111 [00:38<00:38,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8019, UAS: 0.8378, LAS: 0.7302, UEM: 0.2995, LEM: 0.0866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7480, partial_loss/deprel_loss: 1.2659, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2240, loss: 1.9138, batch_reg_loss: 0.0617, reg_loss: 0.0619 ||:  53%|#####3    | 59/111 [00:40<00:35,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7229, UAS: 0.8413, LAS: 0.7346, UEM: 0.3580, LEM: 0.1405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7434, partial_loss/deprel_loss: 2.0320, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0359, loss: 1.8734, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||:  56%|#####5    | 62/111 [00:43<00:36,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7846, UAS: 0.8430, LAS: 0.7366, UEM: 0.3472, LEM: 0.1341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0253, partial_loss/deprel_loss: 1.4828, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4530, loss: 1.8528, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||:  59%|#####9    | 66/111 [00:46<00:32,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8108, UAS: 0.8447, LAS: 0.7383, UEM: 0.3415, LEM: 0.1300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7083, partial_loss/deprel_loss: 1.0955, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0797, loss: 1.8399, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||:  63%|######3   | 70/111 [00:49<00:29,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8163, UAS: 0.8453, LAS: 0.7392, UEM: 0.3375, LEM: 0.1274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6994, partial_loss/deprel_loss: 1.2058, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1661, loss: 1.8386, batch_reg_loss: 0.0616, reg_loss: 0.0619 ||:  66%|######5   | 73/111 [00:51<00:27,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7005, UAS: 0.8452, LAS: 0.7393, UEM: 0.3279, LEM: 0.1228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2810, partial_loss/deprel_loss: 2.1734, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2565, loss: 1.8368, batch_reg_loss: 0.0615, reg_loss: 0.0619 ||:  69%|######9   | 77/111 [00:53<00:23,  1.47it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6741, UAS: 0.8452, LAS: 0.7395, UEM: 0.3431, LEM: 0.1362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5383, partial_loss/deprel_loss: 2.6162, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6622, loss: 1.8377, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||:  72%|#######2  | 80/111 [00:55<00:21,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7905, UAS: 0.8448, LAS: 0.7389, UEM: 0.3355, LEM: 0.1324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8467, partial_loss/deprel_loss: 1.3524, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3128, loss: 1.8435, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||:  76%|#######5  | 84/111 [00:58<00:18,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7866, UAS: 0.8450, LAS: 0.7392, UEM: 0.3311, LEM: 0.1296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9914, partial_loss/deprel_loss: 1.4335, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4066, loss: 1.8406, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||:  78%|#######8  | 87/111 [01:00<00:16,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8356, UAS: 0.8472, LAS: 0.7416, UEM: 0.3370, LEM: 0.1305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3395, partial_loss/deprel_loss: 0.8325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7954, loss: 1.8162, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||:  82%|########1 | 91/111 [01:02<00:13,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6469, UAS: 0.8463, LAS: 0.7407, UEM: 0.3336, LEM: 0.1286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0053, partial_loss/deprel_loss: 2.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 2.5838, loss: 1.8231, batch_reg_loss: 0.0615, reg_loss: 0.0618 ||:  85%|########4 | 94/111 [01:05<00:11,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7256, UAS: 0.8454, LAS: 0.7396, UEM: 0.3284, LEM: 0.1263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6650, partial_loss/deprel_loss: 1.9252, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9346, loss: 1.8328, batch_reg_loss: 0.0614, reg_loss: 0.0618 ||:  87%|########7 | 97/111 [01:07<00:10,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7599, UAS: 0.8465, LAS: 0.7407, UEM: 0.3289, LEM: 0.1240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2847, partial_loss/deprel_loss: 1.7309, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7031, loss: 1.8239, batch_reg_loss: 0.0614, reg_loss: 0.0618 ||:  91%|######### | 101/111 [01:09<00:06,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.8483, LAS: 0.7429, UEM: 0.3366, LEM: 0.1267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5180, partial_loss/deprel_loss: 0.8814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8701, loss: 1.8040, batch_reg_loss: 0.0614, reg_loss: 0.0618 ||:  95%|#########4| 105/111 [01:11<00:03,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7331, UAS: 0.8486, LAS: 0.7433, UEM: 0.3357, LEM: 0.1260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9632, partial_loss/deprel_loss: 1.9598, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0219, loss: 1.8012, batch_reg_loss: 0.0614, reg_loss: 0.0617 ||:  98%|#########8| 109/111 [01:14<00:01,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8351, UAS: 0.8500, LAS: 0.7451, UEM: 0.3439, LEM: 0.1293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5623, partial_loss/deprel_loss: 0.9248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9137, loss: 1.7845, batch_reg_loss: 0.0614, reg_loss: 0.0617 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-06 22:56:33,798 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 22:56:33,798 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.925  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.562  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.062  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - UEM                      |     0.344  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - LAS                      |     0.745  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - loss                     |     1.785  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - LEM                      |     0.129  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 22:56:33,799 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - UAS                      |     0.850  |       N/A\n",
      "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - EM                       |     0.835  |       N/A\n",
      "2023-04-06 22:56:33,800 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 22:56:33,800 - INFO - combo.training.trainer - Epoch duration: 0:01:15.570663\n",
      "2023-04-06 22:56:33,800 - INFO - combo.training.trainer - Estimated training time remaining: 8:55:12\n",
      "2023-04-06 22:56:33,800 - INFO - allennlp.training.trainer - Epoch 5/399\n",
      "2023-04-06 22:56:33,801 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 22:56:33,801 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 22:56:33,806 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7017, UAS: 0.8575, LAS: 0.7564, UEM: 0.2434, LEM: 0.0823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1851, partial_loss/deprel_loss: 2.1142, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1898, loss: 1.6516, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:   4%|3         | 4/111 [00:02<00:55,  1.93it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7902, UAS: 0.8573, LAS: 0.7593, UEM: 0.1945, LEM: 0.0493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1142, partial_loss/deprel_loss: 1.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3831, loss: 1.6800, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:   7%|7         | 8/111 [00:04<00:55,  1.84it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8045, UAS: 0.8581, LAS: 0.7600, UEM: 0.1996, LEM: 0.0437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7492, partial_loss/deprel_loss: 1.2165, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1844, loss: 1.6630, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  10%|9         | 11/111 [00:06<01:00,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7124, UAS: 0.8519, LAS: 0.7533, UEM: 0.1704, LEM: 0.0371, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3078, partial_loss/deprel_loss: 2.1321, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2286, loss: 1.7343, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  13%|#2        | 14/111 [00:08<01:02,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8202, UAS: 0.8522, LAS: 0.7539, UEM: 0.1756, LEM: 0.0394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7495, partial_loss/deprel_loss: 1.1383, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1219, loss: 1.7377, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  15%|#5        | 17/111 [00:11<01:03,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7448, UAS: 0.8579, LAS: 0.7603, UEM: 0.2127, LEM: 0.0579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5514, partial_loss/deprel_loss: 1.6989, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7308, loss: 1.6711, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  18%|#8        | 20/111 [00:13<01:03,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8081, UAS: 0.8630, LAS: 0.7659, UEM: 0.2570, LEM: 0.0807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9484, partial_loss/deprel_loss: 1.1780, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1934, loss: 1.6165, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  21%|##        | 23/111 [00:15<01:03,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7710, UAS: 0.8636, LAS: 0.7669, UEM: 0.2827, LEM: 0.0951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3315, partial_loss/deprel_loss: 1.5198, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5435, loss: 1.6098, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  23%|##3       | 26/111 [00:17<01:01,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7620, UAS: 0.8608, LAS: 0.7644, UEM: 0.3072, LEM: 0.1148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3709, partial_loss/deprel_loss: 1.5272, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5573, loss: 1.6290, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  27%|##7       | 30/111 [00:20<00:55,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8430, UAS: 0.8687, LAS: 0.7732, UEM: 0.3575, LEM: 0.1333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5238, partial_loss/deprel_loss: 0.8705, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8625, loss: 1.5422, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  31%|###       | 34/111 [00:22<00:51,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6280, UAS: 0.8659, LAS: 0.7697, UEM: 0.3664, LEM: 0.1405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.5054, partial_loss/deprel_loss: 2.7331, partial_loss/cycle_loss: 0.0000, batch_loss: 2.9489, loss: 1.5726, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  34%|###4      | 38/111 [00:25<00:48,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7226, UAS: 0.8644, LAS: 0.7677, UEM: 0.3535, LEM: 0.1338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9962, partial_loss/deprel_loss: 2.0087, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0676, loss: 1.5945, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  38%|###7      | 42/111 [00:27<00:45,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7397, UAS: 0.8681, LAS: 0.7717, UEM: 0.3782, LEM: 0.1455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6230, partial_loss/deprel_loss: 1.7756, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8064, loss: 1.5545, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  41%|####1     | 46/111 [00:30<00:42,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.8698, LAS: 0.7736, UEM: 0.3770, LEM: 0.1440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6194, partial_loss/deprel_loss: 0.9456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9417, loss: 1.5345, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  45%|####5     | 50/111 [00:33<00:41,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7631, UAS: 0.8696, LAS: 0.7733, UEM: 0.3760, LEM: 0.1438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5292, partial_loss/deprel_loss: 1.6206, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6637, loss: 1.5373, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  48%|####7     | 53/111 [00:35<00:40,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7952, UAS: 0.8706, LAS: 0.7745, UEM: 0.3732, LEM: 0.1419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0361, partial_loss/deprel_loss: 1.3750, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3686, loss: 1.5272, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  50%|#####     | 56/111 [00:37<00:38,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.8725, LAS: 0.7769, UEM: 0.3885, LEM: 0.1536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6950, partial_loss/deprel_loss: 1.0568, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0458, loss: 1.5054, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  53%|#####3    | 59/111 [00:39<00:36,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.8729, LAS: 0.7771, UEM: 0.3914, LEM: 0.1520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6869, partial_loss/deprel_loss: 1.1239, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0979, loss: 1.5056, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  56%|#####5    | 62/111 [00:42<00:34,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7123, UAS: 0.8726, LAS: 0.7767, UEM: 0.3847, LEM: 0.1476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1384, partial_loss/deprel_loss: 1.9929, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0833, loss: 1.5100, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  59%|#####8    | 65/111 [00:44<00:32,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.8741, LAS: 0.7786, UEM: 0.4104, LEM: 0.1780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1555, partial_loss/deprel_loss: 0.3590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3797, loss: 1.4902, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  61%|######1   | 68/111 [00:46<00:31,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6839, UAS: 0.8727, LAS: 0.7774, UEM: 0.4028, LEM: 0.1735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6867, partial_loss/deprel_loss: 2.2795, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4223, loss: 1.4995, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  64%|######3   | 71/111 [00:48<00:28,  1.40it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7946, UAS: 0.8714, LAS: 0.7764, UEM: 0.3971, LEM: 0.1677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0939, partial_loss/deprel_loss: 1.3590, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3673, loss: 1.5104, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  68%|######7   | 75/111 [00:51<00:24,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6175, UAS: 0.8696, LAS: 0.7746, UEM: 0.3921, LEM: 0.1644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.8233, partial_loss/deprel_loss: 2.8003, partial_loss/cycle_loss: 0.0000, batch_loss: 3.0663, loss: 1.5301, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  71%|#######1  | 79/111 [00:53<00:20,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7637, UAS: 0.8661, LAS: 0.7709, UEM: 0.3842, LEM: 0.1610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5925, partial_loss/deprel_loss: 1.8030, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8223, loss: 1.5739, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  75%|#######4  | 83/111 [00:55<00:18,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7484, UAS: 0.8666, LAS: 0.7714, UEM: 0.3769, LEM: 0.1561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5992, partial_loss/deprel_loss: 1.6861, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7301, loss: 1.5698, batch_reg_loss: 0.0614, reg_loss: 0.0614 ||:  78%|#######8  | 87/111 [00:58<00:16,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6880, UAS: 0.8660, LAS: 0.7708, UEM: 0.3766, LEM: 0.1560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6133, partial_loss/deprel_loss: 2.1378, partial_loss/cycle_loss: 0.0000, batch_loss: 2.2944, loss: 1.5744, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||:  81%|########1 | 90/111 [01:01<00:15,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7145, UAS: 0.8654, LAS: 0.7703, UEM: 0.3729, LEM: 0.1542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3646, partial_loss/deprel_loss: 2.0728, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1926, loss: 1.5798, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||:  84%|########3 | 93/111 [01:03<00:13,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7754, UAS: 0.8652, LAS: 0.7702, UEM: 0.3709, LEM: 0.1526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2314, partial_loss/deprel_loss: 1.5581, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5543, loss: 1.5834, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||:  86%|########6 | 96/111 [01:05<00:10,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7925, UAS: 0.8642, LAS: 0.7695, UEM: 0.3719, LEM: 0.1529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1520, partial_loss/deprel_loss: 1.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3735, loss: 1.5922, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||:  89%|########9 | 99/111 [01:08<00:08,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6972, UAS: 0.8644, LAS: 0.7697, UEM: 0.3691, LEM: 0.1504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3335, partial_loss/deprel_loss: 2.2219, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3058, loss: 1.5920, batch_reg_loss: 0.0615, reg_loss: 0.0614 ||:  93%|#########2| 103/111 [01:10<00:05,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.8655, LAS: 0.7711, UEM: 0.3800, LEM: 0.1593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2474, partial_loss/deprel_loss: 0.5589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5582, loss: 1.5770, batch_reg_loss: 0.0616, reg_loss: 0.0614 ||:  95%|#########5| 106/111 [01:12<00:03,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7927, UAS: 0.8653, LAS: 0.7706, UEM: 0.3763, LEM: 0.1567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9309, partial_loss/deprel_loss: 1.2968, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2852, loss: 1.5809, batch_reg_loss: 0.0616, reg_loss: 0.0614 ||:  98%|#########8| 109/111 [01:14<00:01,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8018, UAS: 0.8655, LAS: 0.7708, UEM: 0.3731, LEM: 0.1547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8911, partial_loss/deprel_loss: 1.3144, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2913, loss: 1.5809, batch_reg_loss: 0.0616, reg_loss: 0.0614 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
      "2023-04-06 22:57:49,583 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8182, UAS: 0.9041, LAS: 0.8223, UEM: 0.3590, LEM: 0.0897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9126, partial_loss/deprel_loss: 32.0601, partial_loss/cycle_loss: 0.0000, batch_loss: 25.8306, loss: 27.0349, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.10it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9214, LAS: 0.8453, UEM: 0.5769, LEM: 0.3145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4594, partial_loss/deprel_loss: 16.4050, partial_loss/cycle_loss: 0.0000, batch_loss: 13.2159, loss: 21.8993, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.11it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7466, UAS: 0.9121, LAS: 0.8362, UEM: 0.5609, LEM: 0.3025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1975, partial_loss/deprel_loss: 54.5662, partial_loss/cycle_loss: 0.0000, batch_loss: 44.0925, loss: 25.0782, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.05it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8448, UAS: 0.9151, LAS: 0.8387, UEM: 0.5397, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6377, partial_loss/deprel_loss: 22.6314, partial_loss/cycle_loss: 0.0000, batch_loss: 18.2327, loss: 23.8980, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.06it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8053, UAS: 0.9130, LAS: 0.8361, UEM: 0.5198, LEM: 0.2546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3525, partial_loss/deprel_loss: 34.6234, partial_loss/cycle_loss: 0.0000, batch_loss: 27.9692, loss: 24.2112, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.05it/s]\n",
      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-06 22:58:01,929 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.314  |    34.623\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.891  |     1.353\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.061  |     0.000\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - UEM                      |     0.373  |     0.520\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - LAS                      |     0.771  |     0.836\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - loss                     |     1.581  |    24.211\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - LEM                      |     0.155  |     0.255\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - UAS                      |     0.866  |     0.913\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-06 22:58:01,930 - INFO - combo.training.tensorboard_writer - EM                       |     0.802  |     0.805\n",
      "2023-04-06 22:58:01,931 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 22:58:01,931 - INFO - combo.training.trainer - Epoch duration: 0:01:28.130781\n",
      "2023-04-06 22:58:01,931 - INFO - combo.training.trainer - Estimated training time remaining: 9:01:20\n",
      "2023-04-06 22:58:01,931 - INFO - allennlp.training.trainer - Epoch 6/399\n",
      "2023-04-06 22:58:01,932 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 22:58:01,932 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 22:58:01,939 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7928, UAS: 0.8946, LAS: 0.8032, UEM: 0.3837, LEM: 0.1392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9781, partial_loss/deprel_loss: 1.3434, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3320, loss: 1.3132, batch_reg_loss: 0.0616, reg_loss: 0.0616 ||:   3%|2         | 3/111 [00:02<01:16,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8273, UAS: 0.8970, LAS: 0.8065, UEM: 0.4021, LEM: 0.1350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5714, partial_loss/deprel_loss: 0.9386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9268, loss: 1.2471, batch_reg_loss: 0.0616, reg_loss: 0.0616 ||:   5%|5         | 6/111 [00:04<01:12,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8161, UAS: 0.8897, LAS: 0.7999, UEM: 0.3630, LEM: 0.1180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9064, partial_loss/deprel_loss: 1.2405, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2353, loss: 1.3079, batch_reg_loss: 0.0617, reg_loss: 0.0616 ||:   9%|9         | 10/111 [00:06<01:07,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7893, UAS: 0.8751, LAS: 0.7831, UEM: 0.3085, LEM: 0.0989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1124, partial_loss/deprel_loss: 1.4383, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4348, loss: 1.4786, batch_reg_loss: 0.0617, reg_loss: 0.0616 ||:  13%|#2        | 14/111 [00:08<01:02,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8441, UAS: 0.8743, LAS: 0.7827, UEM: 0.3527, LEM: 0.1199, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4962, partial_loss/deprel_loss: 0.8334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8276, loss: 1.4829, batch_reg_loss: 0.0617, reg_loss: 0.0616 ||:  15%|#5        | 17/111 [00:11<01:04,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6250, UAS: 0.8694, LAS: 0.7787, UEM: 0.3480, LEM: 0.1177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 4.1969, partial_loss/deprel_loss: 2.8191, partial_loss/cycle_loss: 0.0000, batch_loss: 3.1564, loss: 1.5361, batch_reg_loss: 0.0617, reg_loss: 0.0617 ||:  19%|#8        | 21/111 [00:13<01:00,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7569, UAS: 0.8693, LAS: 0.7786, UEM: 0.3166, LEM: 0.1037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5271, partial_loss/deprel_loss: 1.8119, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8167, loss: 1.5297, batch_reg_loss: 0.0617, reg_loss: 0.0617 ||:  23%|##2       | 25/111 [00:16<00:56,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7141, UAS: 0.8677, LAS: 0.7759, UEM: 0.3006, LEM: 0.0945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3811, partial_loss/deprel_loss: 2.0258, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1586, loss: 1.5526, batch_reg_loss: 0.0618, reg_loss: 0.0617 ||:  26%|##6       | 29/111 [00:18<00:53,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7306, UAS: 0.8672, LAS: 0.7753, UEM: 0.3126, LEM: 0.1007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0218, partial_loss/deprel_loss: 1.8331, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9327, loss: 1.5604, batch_reg_loss: 0.0618, reg_loss: 0.0617 ||:  30%|##9       | 33/111 [00:21<00:50,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7770, UAS: 0.8695, LAS: 0.7770, UEM: 0.3171, LEM: 0.1003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3398, partial_loss/deprel_loss: 1.4502, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4899, loss: 1.5471, batch_reg_loss: 0.0618, reg_loss: 0.0617 ||:  33%|###3      | 37/111 [00:23<00:46,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7841, UAS: 0.8650, LAS: 0.7722, UEM: 0.3010, LEM: 0.0950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2401, partial_loss/deprel_loss: 1.4031, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4324, loss: 1.6028, batch_reg_loss: 0.0619, reg_loss: 0.0617 ||:  37%|###6      | 41/111 [00:26<00:42,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.8680, LAS: 0.7754, UEM: 0.3355, LEM: 0.1209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.5893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5828, loss: 1.5741, batch_reg_loss: 0.0619, reg_loss: 0.0617 ||:  41%|####      | 45/111 [00:29<00:43,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8182, UAS: 0.8696, LAS: 0.7771, UEM: 0.3369, LEM: 0.1205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6923, partial_loss/deprel_loss: 1.0521, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0421, loss: 1.5538, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||:  44%|####4     | 49/111 [00:31<00:41,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7539, UAS: 0.8692, LAS: 0.7765, UEM: 0.3256, LEM: 0.1145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6915, partial_loss/deprel_loss: 1.8414, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8734, loss: 1.5572, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||:  48%|####7     | 53/111 [00:34<00:38,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.8703, LAS: 0.7782, UEM: 0.3360, LEM: 0.1201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6520, partial_loss/deprel_loss: 0.8937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9074, loss: 1.5379, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||:  51%|#####1    | 57/111 [00:37<00:37,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8116, UAS: 0.8717, LAS: 0.7799, UEM: 0.3610, LEM: 0.1445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9092, partial_loss/deprel_loss: 1.1890, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1951, loss: 1.5218, batch_reg_loss: 0.0620, reg_loss: 0.0618 ||:  54%|#####4    | 60/111 [00:39<00:36,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8035, UAS: 0.8727, LAS: 0.7813, UEM: 0.3561, LEM: 0.1403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1905, partial_loss/deprel_loss: 1.2473, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2980, loss: 1.5067, batch_reg_loss: 0.0621, reg_loss: 0.0618 ||:  57%|#####6    | 63/111 [00:42<00:34,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.8749, LAS: 0.7839, UEM: 0.3711, LEM: 0.1484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2916, partial_loss/deprel_loss: 0.6615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6496, loss: 1.4817, batch_reg_loss: 0.0621, reg_loss: 0.0618 ||:  59%|#####9    | 66/111 [00:44<00:31,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7580, UAS: 0.8736, LAS: 0.7826, UEM: 0.3745, LEM: 0.1515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5556, partial_loss/deprel_loss: 1.6028, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6555, loss: 1.4939, batch_reg_loss: 0.0621, reg_loss: 0.0618 ||:  63%|######3   | 70/111 [00:46<00:28,  1.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.8744, LAS: 0.7837, UEM: 0.3851, LEM: 0.1595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3390, partial_loss/deprel_loss: 0.6582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6565, loss: 1.4852, batch_reg_loss: 0.0621, reg_loss: 0.0619 ||:  66%|######5   | 73/111 [00:50<00:34,  1.10it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8116, UAS: 0.8754, LAS: 0.7846, UEM: 0.3853, LEM: 0.1580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8573, partial_loss/deprel_loss: 1.2353, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2218, loss: 1.4768, batch_reg_loss: 0.0621, reg_loss: 0.0619 ||:  68%|######8   | 76/111 [00:53<00:31,  1.13it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.8775, LAS: 0.7871, UEM: 0.4008, LEM: 0.1662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4426, partial_loss/deprel_loss: 0.8148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8025, loss: 1.4523, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||:  71%|#######1  | 79/111 [00:55<00:27,  1.17it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7632, UAS: 0.8768, LAS: 0.7867, UEM: 0.4232, LEM: 0.1931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3685, partial_loss/deprel_loss: 1.5348, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5637, loss: 1.4562, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||:  74%|#######3  | 82/111 [00:58<00:24,  1.21it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7120, UAS: 0.8759, LAS: 0.7859, UEM: 0.4157, LEM: 0.1885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3845, partial_loss/deprel_loss: 2.0313, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1642, loss: 1.4645, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||:  77%|#######7  | 86/111 [01:00<00:18,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8155, UAS: 0.8760, LAS: 0.7861, UEM: 0.4115, LEM: 0.1853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8067, partial_loss/deprel_loss: 1.1319, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1291, loss: 1.4605, batch_reg_loss: 0.0622, reg_loss: 0.0619 ||:  80%|########  | 89/111 [01:02<00:16,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7328, UAS: 0.8753, LAS: 0.7855, UEM: 0.4026, LEM: 0.1804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2779, partial_loss/deprel_loss: 1.9162, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0508, loss: 1.4669, batch_reg_loss: 0.0623, reg_loss: 0.0619 ||:  84%|########3 | 93/111 [01:04<00:12,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8328, UAS: 0.8765, LAS: 0.7868, UEM: 0.4051, LEM: 0.1809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8328, partial_loss/deprel_loss: 1.0645, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0804, loss: 1.4538, batch_reg_loss: 0.0623, reg_loss: 0.0619 ||:  86%|########6 | 96/111 [01:06<00:10,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8406, UAS: 0.8762, LAS: 0.7865, UEM: 0.4014, LEM: 0.1783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5521, partial_loss/deprel_loss: 0.9905, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9651, loss: 1.4581, batch_reg_loss: 0.0623, reg_loss: 0.0619 ||:  89%|########9 | 99/111 [01:09<00:08,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7715, UAS: 0.8767, LAS: 0.7872, UEM: 0.3993, LEM: 0.1761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3737, partial_loss/deprel_loss: 1.5367, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5665, loss: 1.4511, batch_reg_loss: 0.0624, reg_loss: 0.0620 ||:  92%|#########1| 102/111 [01:11<00:06,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7680, UAS: 0.8764, LAS: 0.7870, UEM: 0.3919, LEM: 0.1721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4850, partial_loss/deprel_loss: 1.6062, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6444, loss: 1.4537, batch_reg_loss: 0.0624, reg_loss: 0.0620 ||:  95%|#########5| 106/111 [01:13<00:03,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.8768, LAS: 0.7875, UEM: 0.3925, LEM: 0.1722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4828, partial_loss/deprel_loss: 0.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8236, loss: 1.4500, batch_reg_loss: 0.0624, reg_loss: 0.0620 ||:  98%|#########8| 109/111 [01:15<00:01,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8117, UAS: 0.8776, LAS: 0.7883, UEM: 0.3955, LEM: 0.1736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9031, partial_loss/deprel_loss: 1.2503, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2433, loss: 1.4419, batch_reg_loss: 0.0625, reg_loss: 0.0620 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.250  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.903  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.062  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - UEM                      |     0.395  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - LAS                      |     0.788  |       N/A\n",
      "2023-04-06 22:59:19,352 - INFO - combo.training.tensorboard_writer - loss                     |     1.442  |       N/A\n",
      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - LEM                      |     0.174  |       N/A\n",
      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - UAS                      |     0.878  |       N/A\n",
      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - EM                       |     0.812  |       N/A\n",
      "2023-04-06 22:59:19,353 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 22:59:19,354 - INFO - combo.training.trainer - Epoch duration: 0:01:17.422262\n",
      "2023-04-06 22:59:19,354 - INFO - combo.training.trainer - Estimated training time remaining: 8:55:16\n",
      "2023-04-06 22:59:19,354 - INFO - allennlp.training.trainer - Epoch 7/399\n",
      "2023-04-06 22:59:19,354 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 22:59:19,354 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 22:59:19,361 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8629, UAS: 0.8724, LAS: 0.7842, UEM: 0.3680, LEM: 0.1364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4368, partial_loss/deprel_loss: 0.7830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7763, loss: 1.4874, batch_reg_loss: 0.0625, reg_loss: 0.0625 ||:   4%|3         | 4/111 [00:02<01:11,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7297, UAS: 0.8701, LAS: 0.7828, UEM: 0.4033, LEM: 0.1768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0957, partial_loss/deprel_loss: 1.9928, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0759, loss: 1.5090, batch_reg_loss: 0.0625, reg_loss: 0.0625 ||:   6%|6         | 7/111 [00:05<01:13,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7719, UAS: 0.8774, LAS: 0.7933, UEM: 0.3826, LEM: 0.1651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4563, partial_loss/deprel_loss: 1.6923, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7077, loss: 1.4414, batch_reg_loss: 0.0626, reg_loss: 0.0625 ||:  10%|9         | 11/111 [00:07<01:07,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8024, UAS: 0.8787, LAS: 0.7934, UEM: 0.3521, LEM: 0.1407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9573, partial_loss/deprel_loss: 1.2649, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2660, loss: 1.4205, batch_reg_loss: 0.0626, reg_loss: 0.0625 ||:  14%|#3        | 15/111 [00:09<01:01,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7615, UAS: 0.8748, LAS: 0.7881, UEM: 0.3135, LEM: 0.1196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6249, partial_loss/deprel_loss: 1.6581, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7141, loss: 1.4666, batch_reg_loss: 0.0627, reg_loss: 0.0626 ||:  17%|#7        | 19/111 [00:12<00:58,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8370, UAS: 0.8822, LAS: 0.7962, UEM: 0.3660, LEM: 0.1485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6126, partial_loss/deprel_loss: 0.9570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9508, loss: 1.3872, batch_reg_loss: 0.0627, reg_loss: 0.0626 ||:  20%|#9        | 22/111 [00:14<00:58,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6689, UAS: 0.8766, LAS: 0.7911, UEM: 0.3612, LEM: 0.1459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2741, partial_loss/deprel_loss: 2.4141, partial_loss/cycle_loss: 0.0000, batch_loss: 2.6488, loss: 1.4397, batch_reg_loss: 0.0628, reg_loss: 0.0626 ||:  23%|##3       | 26/111 [00:16<00:53,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8573, UAS: 0.8769, LAS: 0.7922, UEM: 0.3532, LEM: 0.1394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6586, partial_loss/deprel_loss: 0.9206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9310, loss: 1.4379, batch_reg_loss: 0.0628, reg_loss: 0.0626 ||:  27%|##7       | 30/111 [00:19<00:51,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8501, UAS: 0.8768, LAS: 0.7918, UEM: 0.3561, LEM: 0.1370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4872, partial_loss/deprel_loss: 0.8191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8156, loss: 1.4428, batch_reg_loss: 0.0629, reg_loss: 0.0627 ||:  31%|###       | 34/111 [00:21<00:49,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7718, UAS: 0.8759, LAS: 0.7906, UEM: 0.3526, LEM: 0.1360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3521, partial_loss/deprel_loss: 1.4910, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5261, loss: 1.4532, batch_reg_loss: 0.0629, reg_loss: 0.0627 ||:  34%|###4      | 38/111 [00:24<00:47,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7682, UAS: 0.8763, LAS: 0.7911, UEM: 0.3421, LEM: 0.1291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5765, partial_loss/deprel_loss: 1.6436, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6931, loss: 1.4514, batch_reg_loss: 0.0630, reg_loss: 0.0627 ||:  38%|###7      | 42/111 [00:27<00:45,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8301, UAS: 0.8781, LAS: 0.7929, UEM: 0.3316, LEM: 0.1220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7117, partial_loss/deprel_loss: 1.1158, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0980, loss: 1.4348, batch_reg_loss: 0.0630, reg_loss: 0.0627 ||:  41%|####1     | 46/111 [00:29<00:40,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7495, UAS: 0.8762, LAS: 0.7916, UEM: 0.3351, LEM: 0.1242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0049, partial_loss/deprel_loss: 1.8432, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9386, loss: 1.4529, batch_reg_loss: 0.0631, reg_loss: 0.0628 ||:  45%|####5     | 50/111 [00:31<00:37,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7735, UAS: 0.8790, LAS: 0.7953, UEM: 0.3877, LEM: 0.1736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4529, partial_loss/deprel_loss: 1.4813, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5387, loss: 1.4166, batch_reg_loss: 0.0631, reg_loss: 0.0628 ||:  49%|####8     | 54/111 [00:35<00:39,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8136, UAS: 0.8792, LAS: 0.7954, UEM: 0.3826, LEM: 0.1685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9952, partial_loss/deprel_loss: 1.2018, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2236, loss: 1.4151, batch_reg_loss: 0.0631, reg_loss: 0.0628 ||:  51%|#####1    | 57/111 [00:37<00:37,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7092, UAS: 0.8797, LAS: 0.7962, UEM: 0.4184, LEM: 0.2082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7240, partial_loss/deprel_loss: 2.1644, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3395, loss: 1.4103, batch_reg_loss: 0.0632, reg_loss: 0.0628 ||:  54%|#####4    | 60/111 [00:39<00:36,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7540, UAS: 0.8799, LAS: 0.7961, UEM: 0.4070, LEM: 0.1991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8092, partial_loss/deprel_loss: 1.7140, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7963, loss: 1.4121, batch_reg_loss: 0.0632, reg_loss: 0.0628 ||:  58%|#####7    | 64/111 [00:42<00:32,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8109, UAS: 0.8805, LAS: 0.7967, UEM: 0.4083, LEM: 0.2006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9000, partial_loss/deprel_loss: 1.1946, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1989, loss: 1.4027, batch_reg_loss: 0.0633, reg_loss: 0.0629 ||:  60%|######    | 67/111 [00:44<00:30,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8382, UAS: 0.8815, LAS: 0.7979, UEM: 0.4116, LEM: 0.2017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6882, partial_loss/deprel_loss: 0.9346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9486, loss: 1.3897, batch_reg_loss: 0.0633, reg_loss: 0.0629 ||:  63%|######3   | 70/111 [00:46<00:30,  1.36it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.8812, LAS: 0.7976, UEM: 0.4122, LEM: 0.2035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3938, partial_loss/deprel_loss: 0.6384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6529, loss: 1.3910, batch_reg_loss: 0.0634, reg_loss: 0.0629 ||:  66%|######5   | 73/111 [00:48<00:27,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8465, UAS: 0.8816, LAS: 0.7982, UEM: 0.4122, LEM: 0.2019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6296, partial_loss/deprel_loss: 0.9116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9186, loss: 1.3860, batch_reg_loss: 0.0634, reg_loss: 0.0629 ||:  68%|######8   | 76/111 [00:50<00:25,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7487, UAS: 0.8817, LAS: 0.7982, UEM: 0.4104, LEM: 0.1998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8556, partial_loss/deprel_loss: 1.6892, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7859, loss: 1.3852, batch_reg_loss: 0.0634, reg_loss: 0.0629 ||:  71%|#######1  | 79/111 [00:53<00:22,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8273, UAS: 0.8828, LAS: 0.7995, UEM: 0.4079, LEM: 0.1960, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8511, partial_loss/deprel_loss: 1.1586, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1606, loss: 1.3738, batch_reg_loss: 0.0635, reg_loss: 0.0630 ||:  74%|#######3  | 82/111 [00:55<00:20,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7909, UAS: 0.8831, LAS: 0.7998, UEM: 0.3986, LEM: 0.1897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2809, partial_loss/deprel_loss: 1.4356, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4682, loss: 1.3714, batch_reg_loss: 0.0635, reg_loss: 0.0630 ||:  77%|#######7  | 86/111 [00:57<00:17,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.8841, LAS: 0.8011, UEM: 0.4051, LEM: 0.1932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3861, partial_loss/deprel_loss: 0.6754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6811, loss: 1.3591, batch_reg_loss: 0.0636, reg_loss: 0.0630 ||:  80%|########  | 89/111 [00:59<00:15,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8384, UAS: 0.8851, LAS: 0.8022, UEM: 0.4059, LEM: 0.1904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7558, partial_loss/deprel_loss: 0.8878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9250, loss: 1.3475, batch_reg_loss: 0.0636, reg_loss: 0.0630 ||:  83%|########2 | 92/111 [01:01<00:13,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6849, UAS: 0.8847, LAS: 0.8021, UEM: 0.4073, LEM: 0.1900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0226, partial_loss/deprel_loss: 2.1493, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3876, loss: 1.3458, batch_reg_loss: 0.0637, reg_loss: 0.0630 ||:  86%|########6 | 96/111 [01:04<00:10,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7306, UAS: 0.8834, LAS: 0.8006, UEM: 0.4017, LEM: 0.1872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0285, partial_loss/deprel_loss: 1.8749, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9693, loss: 1.3587, batch_reg_loss: 0.0637, reg_loss: 0.0631 ||:  89%|########9 | 99/111 [01:06<00:08,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8169, UAS: 0.8834, LAS: 0.8005, UEM: 0.4020, LEM: 0.1868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8733, partial_loss/deprel_loss: 1.1504, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1587, loss: 1.3588, batch_reg_loss: 0.0637, reg_loss: 0.0631 ||:  92%|#########1| 102/111 [01:09<00:06,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.8850, LAS: 0.8022, UEM: 0.4122, LEM: 0.1905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3123, partial_loss/deprel_loss: 0.6209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6230, loss: 1.3414, batch_reg_loss: 0.0638, reg_loss: 0.0631 ||:  95%|#########5| 106/111 [01:11<00:03,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.8857, LAS: 0.8029, UEM: 0.4147, LEM: 0.1914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4652, partial_loss/deprel_loss: 0.7915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7900, loss: 1.3339, batch_reg_loss: 0.0638, reg_loss: 0.0631 ||:  98%|#########8| 109/111 [01:13<00:01,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8271, UAS: 0.8854, LAS: 0.8026, UEM: 0.4124, LEM: 0.1897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8597, partial_loss/deprel_loss: 0.9947, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0315, loss: 1.3354, batch_reg_loss: 0.0638, reg_loss: 0.0631 ||: 100%|##########| 111/111 [01:15<00:00,  1.48it/s]\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.995  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.860  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.063  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - UEM                      |     0.412  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - LAS                      |     0.803  |       N/A\n",
      "2023-04-06 23:00:34,375 - INFO - combo.training.tensorboard_writer - loss                     |     1.335  |       N/A\n",
      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - LEM                      |     0.190  |       N/A\n",
      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - UAS                      |     0.885  |       N/A\n",
      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - EM                       |     0.827  |       N/A\n",
      "2023-04-06 23:00:34,376 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:00:34,377 - INFO - combo.training.trainer - Epoch duration: 0:01:15.022627\n",
      "2023-04-06 23:00:34,377 - INFO - combo.training.trainer - Estimated training time remaining: 8:48:26\n",
      "2023-04-06 23:00:34,377 - INFO - allennlp.training.trainer - Epoch 8/399\n",
      "2023-04-06 23:00:34,377 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-06 23:00:34,377 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:00:34,384 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8241, UAS: 0.8930, LAS: 0.8071, UEM: 0.2937, LEM: 0.0688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8920, partial_loss/deprel_loss: 1.0848, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1101, loss: 1.2838, batch_reg_loss: 0.0639, reg_loss: 0.0639 ||:   4%|3         | 4/111 [00:02<01:05,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8233, UAS: 0.8886, LAS: 0.8066, UEM: 0.3058, LEM: 0.0816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9010, partial_loss/deprel_loss: 1.1552, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1683, loss: 1.2793, batch_reg_loss: 0.0640, reg_loss: 0.0639 ||:   7%|7         | 8/111 [00:04<01:03,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9018, LAS: 0.8220, UEM: 0.5010, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1971, partial_loss/deprel_loss: 0.4135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4342, loss: 1.1506, batch_reg_loss: 0.0640, reg_loss: 0.0639 ||:  10%|9         | 11/111 [00:07<01:03,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8606, UAS: 0.8885, LAS: 0.8093, UEM: 0.5000, LEM: 0.2546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4594, partial_loss/deprel_loss: 0.6960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 1.3050, batch_reg_loss: 0.0640, reg_loss: 0.0640 ||:  13%|#2        | 14/111 [00:09<01:07,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.8872, LAS: 0.8077, UEM: 0.4793, LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5064, partial_loss/deprel_loss: 0.7968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8028, loss: 1.3102, batch_reg_loss: 0.0641, reg_loss: 0.0640 ||:  15%|#5        | 17/111 [00:11<01:08,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7552, UAS: 0.8892, LAS: 0.8111, UEM: 0.4579, LEM: 0.2212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8160, partial_loss/deprel_loss: 1.5796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6910, loss: 1.2699, batch_reg_loss: 0.0641, reg_loss: 0.0640 ||:  19%|#8        | 21/111 [00:14<01:01,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8090, UAS: 0.8856, LAS: 0.8065, UEM: 0.4306, LEM: 0.2060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1190, partial_loss/deprel_loss: 1.1705, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2244, loss: 1.3033, batch_reg_loss: 0.0642, reg_loss: 0.0640 ||:  22%|##1       | 24/111 [00:16<00:59,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7897, UAS: 0.8861, LAS: 0.8069, UEM: 0.4112, LEM: 0.1927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2958, partial_loss/deprel_loss: 1.3087, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3704, loss: 1.2958, batch_reg_loss: 0.0642, reg_loss: 0.0640 ||:  24%|##4       | 27/111 [00:18<01:00,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7306, UAS: 0.8839, LAS: 0.8044, UEM: 0.4072, LEM: 0.1892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4421, partial_loss/deprel_loss: 1.8969, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0702, loss: 1.3262, batch_reg_loss: 0.0643, reg_loss: 0.0641 ||:  27%|##7       | 30/111 [00:20<00:59,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8245, UAS: 0.8813, LAS: 0.8011, UEM: 0.3874, LEM: 0.1759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8848, partial_loss/deprel_loss: 1.1863, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1903, loss: 1.3609, batch_reg_loss: 0.0644, reg_loss: 0.0641 ||:  31%|###       | 34/111 [00:23<00:53,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7990, UAS: 0.8837, LAS: 0.8038, UEM: 0.4387, LEM: 0.2372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1111, partial_loss/deprel_loss: 1.2691, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3019, loss: 1.3366, batch_reg_loss: 0.0644, reg_loss: 0.0641 ||:  33%|###3      | 37/111 [00:25<00:52,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7902, UAS: 0.8854, LAS: 0.8050, UEM: 0.4272, LEM: 0.2249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3545, partial_loss/deprel_loss: 1.4825, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5214, loss: 1.3286, batch_reg_loss: 0.0645, reg_loss: 0.0642 ||:  36%|###6      | 40/111 [00:27<00:49,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.8877, LAS: 0.8072, UEM: 0.4217, LEM: 0.2144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5300, partial_loss/deprel_loss: 0.9049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8945, loss: 1.3072, batch_reg_loss: 0.0645, reg_loss: 0.0642 ||:  39%|###8      | 43/111 [00:29<00:47,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8620, UAS: 0.8908, LAS: 0.8105, UEM: 0.4339, LEM: 0.2148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5897, partial_loss/deprel_loss: 0.8662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8754, loss: 1.2774, batch_reg_loss: 0.0646, reg_loss: 0.0642 ||:  41%|####1     | 46/111 [00:32<00:47,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8295, UAS: 0.8909, LAS: 0.8105, UEM: 0.4243, LEM: 0.2074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8100, partial_loss/deprel_loss: 0.9878, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0168, loss: 1.2768, batch_reg_loss: 0.0646, reg_loss: 0.0642 ||:  44%|####4     | 49/111 [00:34<00:45,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.8901, LAS: 0.8096, UEM: 0.4112, LEM: 0.1977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7876, partial_loss/deprel_loss: 0.9327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9683, loss: 1.2818, batch_reg_loss: 0.0647, reg_loss: 0.0643 ||:  48%|####7     | 53/111 [00:36<00:39,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.8901, LAS: 0.8096, UEM: 0.4056, LEM: 0.1924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6974, partial_loss/deprel_loss: 0.9227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9424, loss: 1.2799, batch_reg_loss: 0.0647, reg_loss: 0.0643 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8424, UAS: 0.8911, LAS: 0.8107, UEM: 0.4065, LEM: 0.1909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7933, partial_loss/deprel_loss: 0.9271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9651, loss: 1.2707, batch_reg_loss: 0.0648, reg_loss: 0.0643 ||:  54%|#####4    | 60/111 [00:41<00:34,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.8913, LAS: 0.8110, UEM: 0.4163, LEM: 0.1957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5222, partial_loss/deprel_loss: 0.8511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8501, loss: 1.2691, batch_reg_loss: 0.0648, reg_loss: 0.0643 ||:  57%|#####6    | 63/111 [00:43<00:33,  1.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.8926, LAS: 0.8125, UEM: 0.4278, LEM: 0.2061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7491, partial_loss/deprel_loss: 1.0206, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0312, loss: 1.2552, batch_reg_loss: 0.0649, reg_loss: 0.0644 ||:  59%|#####9    | 66/111 [00:45<00:31,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8008, UAS: 0.8931, LAS: 0.8132, UEM: 0.4331, LEM: 0.2078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1884, partial_loss/deprel_loss: 1.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3227, loss: 1.2490, batch_reg_loss: 0.0649, reg_loss: 0.0644 ||:  63%|######3   | 70/111 [00:48<00:27,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7758, UAS: 0.8925, LAS: 0.8121, UEM: 0.4233, LEM: 0.2014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4103, partial_loss/deprel_loss: 1.5663, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6001, loss: 1.2582, batch_reg_loss: 0.0650, reg_loss: 0.0644 ||:  67%|######6   | 74/111 [00:50<00:24,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.8917, LAS: 0.8114, UEM: 0.4194, LEM: 0.1977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5735, partial_loss/deprel_loss: 0.8557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8643, loss: 1.2660, batch_reg_loss: 0.0651, reg_loss: 0.0645 ||:  70%|#######   | 78/111 [00:53<00:22,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.8931, LAS: 0.8129, UEM: 0.4242, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.7510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7497, loss: 1.2519, batch_reg_loss: 0.0651, reg_loss: 0.0645 ||:  73%|#######2  | 81/111 [00:55<00:21,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6999, UAS: 0.8912, LAS: 0.8106, UEM: 0.4176, LEM: 0.1948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5586, partial_loss/deprel_loss: 2.1598, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3047, loss: 1.2725, batch_reg_loss: 0.0651, reg_loss: 0.0645 ||:  76%|#######5  | 84/111 [00:57<00:18,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7984, UAS: 0.8920, LAS: 0.8114, UEM: 0.4254, LEM: 0.2002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2174, partial_loss/deprel_loss: 1.3746, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4084, loss: 1.2663, batch_reg_loss: 0.0652, reg_loss: 0.0645 ||:  79%|#######9  | 88/111 [01:00<00:15,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7645, UAS: 0.8914, LAS: 0.8106, UEM: 0.4171, LEM: 0.1945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7351, partial_loss/deprel_loss: 1.6841, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7596, loss: 1.2742, batch_reg_loss: 0.0653, reg_loss: 0.0646 ||:  83%|########2 | 92/111 [01:02<00:12,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.8916, LAS: 0.8109, UEM: 0.4169, LEM: 0.1940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4136, partial_loss/deprel_loss: 0.6496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6677, loss: 1.2720, batch_reg_loss: 0.0653, reg_loss: 0.0646 ||:  86%|########6 | 96/111 [01:05<00:10,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8617, UAS: 0.8930, LAS: 0.8124, UEM: 0.4280, LEM: 0.2003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4469, partial_loss/deprel_loss: 0.7590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7619, loss: 1.2586, batch_reg_loss: 0.0654, reg_loss: 0.0646 ||:  89%|########9 | 99/111 [01:08<00:08,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7769, UAS: 0.8935, LAS: 0.8130, UEM: 0.4298, LEM: 0.2005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6781, partial_loss/deprel_loss: 1.5453, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6373, loss: 1.2527, batch_reg_loss: 0.0655, reg_loss: 0.0646 ||:  92%|#########1| 102/111 [01:10<00:06,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.6829, UAS: 0.8911, LAS: 0.8105, UEM: 0.4258, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.1513, partial_loss/deprel_loss: 2.1113, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3848, loss: 1.2753, batch_reg_loss: 0.0655, reg_loss: 0.0647 ||:  95%|#########4| 105/111 [01:13<00:04,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7566, UAS: 0.8903, LAS: 0.8095, UEM: 0.4247, LEM: 0.1967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8494, partial_loss/deprel_loss: 1.7516, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8367, loss: 1.2862, batch_reg_loss: 0.0656, reg_loss: 0.0647 ||:  97%|#########7| 108/111 [01:15<00:02,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8283, UAS: 0.8911, LAS: 0.8104, UEM: 0.4280, LEM: 0.1988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7554, partial_loss/deprel_loss: 1.0998, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0965, loss: 1.2771, batch_reg_loss: 0.0656, reg_loss: 0.0647 ||: 100%|##########| 111/111 [01:16<00:00,  1.44it/s]\n",
      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:01:51,357 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.100  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.755  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.065  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - UEM                      |     0.428  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - LAS                      |     0.810  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - loss                     |     1.277  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2424.097  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - LEM                      |     0.199  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - UAS                      |     0.891  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - EM                       |     0.828  |       N/A\n",
      "2023-04-06 23:01:51,358 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:01:51,359 - INFO - combo.training.trainer - Epoch duration: 0:01:16.982102\n",
      "2023-04-06 23:01:51,359 - INFO - combo.training.trainer - Estimated training time remaining: 8:44:16\n",
      "2023-04-06 23:01:51,359 - INFO - allennlp.training.trainer - Epoch 9/399\n",
      "2023-04-06 23:01:51,359 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:01:51,359 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:01:51,366 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8694, UAS: 0.9255, LAS: 0.8548, UEM: 0.5504, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4220, partial_loss/deprel_loss: 0.6260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.8275, batch_reg_loss: 0.0656, reg_loss: 0.0656 ||:   3%|2         | 3/111 [00:02<01:21,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9245, LAS: 0.8515, UEM: 0.5266, LEM: 0.2491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7531, partial_loss/deprel_loss: 0.9576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9824, loss: 0.8760, batch_reg_loss: 0.0657, reg_loss: 0.0657 ||:   5%|5         | 6/111 [00:04<01:20,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8321, UAS: 0.9161, LAS: 0.8419, UEM: 0.4940, LEM: 0.2270, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8656, partial_loss/deprel_loss: 1.0827, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.9815, batch_reg_loss: 0.0657, reg_loss: 0.0657 ||:   8%|8         | 9/111 [00:06<01:16,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8601, UAS: 0.9148, LAS: 0.8396, UEM: 0.4936, LEM: 0.2105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4626, partial_loss/deprel_loss: 0.7863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7874, loss: 1.0120, batch_reg_loss: 0.0658, reg_loss: 0.0657 ||:  11%|#         | 12/111 [00:09<01:14,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7472, UAS: 0.9118, LAS: 0.8363, UEM: 0.4936, LEM: 0.2092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1431, partial_loss/deprel_loss: 1.7409, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8873, loss: 1.0389, batch_reg_loss: 0.0659, reg_loss: 0.0657 ||:  14%|#4        | 16/111 [00:11<01:06,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8605, UAS: 0.9033, LAS: 0.8265, UEM: 0.4604, LEM: 0.1912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5063, partial_loss/deprel_loss: 0.8511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8481, loss: 1.1324, batch_reg_loss: 0.0659, reg_loss: 0.0658 ||:  18%|#8        | 20/111 [00:13<01:00,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8059, UAS: 0.9014, LAS: 0.8239, UEM: 0.4295, LEM: 0.1726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1199, partial_loss/deprel_loss: 1.4563, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4550, loss: 1.1575, batch_reg_loss: 0.0660, reg_loss: 0.0658 ||:  22%|##1       | 24/111 [00:16<00:57,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7750, UAS: 0.8952, LAS: 0.8171, UEM: 0.4111, LEM: 0.1644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6847, partial_loss/deprel_loss: 1.5184, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6177, loss: 1.2197, batch_reg_loss: 0.0661, reg_loss: 0.0658 ||:  25%|##5       | 28/111 [00:18<00:52,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7462, UAS: 0.8923, LAS: 0.8137, UEM: 0.3953, LEM: 0.1563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2574, partial_loss/deprel_loss: 1.8212, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9746, loss: 1.2571, batch_reg_loss: 0.0662, reg_loss: 0.0659 ||:  29%|##8       | 32/111 [00:21<00:50,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.8916, LAS: 0.8133, UEM: 0.3940, LEM: 0.1561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5520, partial_loss/deprel_loss: 0.7620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7862, loss: 1.2609, batch_reg_loss: 0.0662, reg_loss: 0.0659 ||:  32%|###2      | 36/111 [00:23<00:48,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8140, UAS: 0.8902, LAS: 0.8114, UEM: 0.3764, LEM: 0.1479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1807, partial_loss/deprel_loss: 1.2136, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2734, loss: 1.2838, batch_reg_loss: 0.0663, reg_loss: 0.0660 ||:  36%|###6      | 40/111 [00:26<00:45,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.8915, LAS: 0.8126, UEM: 0.4016, LEM: 0.1669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2704, partial_loss/deprel_loss: 0.5464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5576, loss: 1.2723, batch_reg_loss: 0.0664, reg_loss: 0.0660 ||:  40%|###9      | 44/111 [00:29<00:43,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8098, UAS: 0.8917, LAS: 0.8122, UEM: 0.3866, LEM: 0.1573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9682, partial_loss/deprel_loss: 1.2962, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2971, loss: 1.2742, batch_reg_loss: 0.0665, reg_loss: 0.0660 ||:  43%|####3     | 48/111 [00:31<00:41,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.8915, LAS: 0.8119, UEM: 0.3734, LEM: 0.1493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8617, partial_loss/deprel_loss: 1.0904, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1112, loss: 1.2763, batch_reg_loss: 0.0666, reg_loss: 0.0661 ||:  47%|####6     | 52/111 [00:34<00:39,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.8937, LAS: 0.8143, UEM: 0.3817, LEM: 0.1525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8274, partial_loss/deprel_loss: 0.9894, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0237, loss: 1.2510, batch_reg_loss: 0.0666, reg_loss: 0.0661 ||:  50%|#####     | 56/111 [00:37<00:37,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7726, UAS: 0.8911, LAS: 0.8114, UEM: 0.3731, LEM: 0.1485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7883, partial_loss/deprel_loss: 1.6515, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7456, loss: 1.2778, batch_reg_loss: 0.0667, reg_loss: 0.0661 ||:  53%|#####3    | 59/111 [00:39<00:35,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.8919, LAS: 0.8123, UEM: 0.3775, LEM: 0.1503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3845, partial_loss/deprel_loss: 0.6765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6848, loss: 1.2680, batch_reg_loss: 0.0668, reg_loss: 0.0662 ||:  57%|#####6    | 63/111 [00:42<00:33,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.8923, LAS: 0.8129, UEM: 0.3800, LEM: 0.1507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3847, partial_loss/deprel_loss: 0.6543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6672, loss: 1.2614, batch_reg_loss: 0.0668, reg_loss: 0.0662 ||:  60%|######    | 67/111 [00:45<00:30,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.8945, LAS: 0.8153, UEM: 0.3887, LEM: 0.1545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4404, partial_loss/deprel_loss: 0.7233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7337, loss: 1.2393, batch_reg_loss: 0.0669, reg_loss: 0.0663 ||:  64%|######3   | 71/111 [00:47<00:27,  1.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8122, UAS: 0.8962, LAS: 0.8173, UEM: 0.4219, LEM: 0.1912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9752, partial_loss/deprel_loss: 1.3085, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3088, loss: 1.2234, batch_reg_loss: 0.0670, reg_loss: 0.0663 ||:  67%|######6   | 74/111 [00:50<00:26,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7825, UAS: 0.8964, LAS: 0.8179, UEM: 0.4236, LEM: 0.1933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5015, partial_loss/deprel_loss: 1.4831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5538, loss: 1.2192, batch_reg_loss: 0.0670, reg_loss: 0.0663 ||:  69%|######9   | 77/111 [00:52<00:24,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8175, UAS: 0.8970, LAS: 0.8187, UEM: 0.4197, LEM: 0.1886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0788, partial_loss/deprel_loss: 1.1409, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1956, loss: 1.2138, batch_reg_loss: 0.0671, reg_loss: 0.0663 ||:  73%|#######2  | 81/111 [00:54<00:20,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8500, UAS: 0.8961, LAS: 0.8179, UEM: 0.4136, LEM: 0.1848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7436, partial_loss/deprel_loss: 0.8710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9127, loss: 1.2214, batch_reg_loss: 0.0672, reg_loss: 0.0664 ||:  77%|#######6  | 85/111 [00:57<00:17,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7341, UAS: 0.8956, LAS: 0.8174, UEM: 0.4083, LEM: 0.1813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2575, partial_loss/deprel_loss: 1.8813, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0237, loss: 1.2272, batch_reg_loss: 0.0672, reg_loss: 0.0664 ||:  80%|########  | 89/111 [00:59<00:14,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.8969, LAS: 0.8191, UEM: 0.4323, LEM: 0.2002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2403, partial_loss/deprel_loss: 0.5870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 1.2123, batch_reg_loss: 0.0673, reg_loss: 0.0665 ||:  84%|########3 | 93/111 [01:02<00:12,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7063, UAS: 0.8948, LAS: 0.8169, UEM: 0.4339, LEM: 0.2011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6918, partial_loss/deprel_loss: 2.1989, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3648, loss: 1.2362, batch_reg_loss: 0.0673, reg_loss: 0.0665 ||:  86%|########6 | 96/111 [01:05<00:10,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8118, UAS: 0.8947, LAS: 0.8168, UEM: 0.4295, LEM: 0.1973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0917, partial_loss/deprel_loss: 1.1721, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2234, loss: 1.2352, batch_reg_loss: 0.0674, reg_loss: 0.0665 ||:  89%|########9 | 99/111 [01:07<00:08,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8250, UAS: 0.8951, LAS: 0.8172, UEM: 0.4260, LEM: 0.1936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9414, partial_loss/deprel_loss: 1.0274, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0777, loss: 1.2291, batch_reg_loss: 0.0675, reg_loss: 0.0665 ||:  93%|#########2| 103/111 [01:10<00:05,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8082, UAS: 0.8962, LAS: 0.8186, UEM: 0.4419, LEM: 0.2084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1479, partial_loss/deprel_loss: 1.1772, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2388, loss: 1.2158, batch_reg_loss: 0.0675, reg_loss: 0.0666 ||:  95%|#########5| 106/111 [01:12<00:03,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8127, UAS: 0.8962, LAS: 0.8185, UEM: 0.4424, LEM: 0.2096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9760, partial_loss/deprel_loss: 1.2365, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2520, loss: 1.2173, batch_reg_loss: 0.0676, reg_loss: 0.0666 ||:  99%|#########9| 110/111 [01:14<00:00,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7871, UAS: 0.8960, LAS: 0.8182, UEM: 0.4402, LEM: 0.2085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3663, partial_loss/deprel_loss: 1.4187, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4759, loss: 1.2197, batch_reg_loss: 0.0676, reg_loss: 0.0666 ||: 100%|##########| 111/111 [01:15<00:00,  1.48it/s]\n",
      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:03:06,509 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.419  |       N/A\n",
      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.366  |       N/A\n",
      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.067  |       N/A\n",
      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - UEM                      |     0.440  |       N/A\n",
      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - LAS                      |     0.818  |       N/A\n",
      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - loss                     |     1.220  |       N/A\n",
      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - LEM                      |     0.209  |       N/A\n",
      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:03:06,510 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - UAS                      |     0.896  |       N/A\n",
      "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - EM                       |     0.787  |       N/A\n",
      "2023-04-06 23:03:06,511 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:03:06,511 - INFO - combo.training.trainer - Epoch duration: 0:01:15.152380\n",
      "2023-04-06 23:03:06,512 - INFO - combo.training.trainer - Estimated training time remaining: 8:39:28\n",
      "2023-04-06 23:03:06,512 - INFO - allennlp.training.trainer - Epoch 10/399\n",
      "2023-04-06 23:03:06,512 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:03:06,512 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:03:06,518 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8555, UAS: 0.9211, LAS: 0.8489, UEM: 0.4350, LEM: 0.1673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6806, partial_loss/deprel_loss: 0.8446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8795, loss: 0.9582, batch_reg_loss: 0.0677, reg_loss: 0.0676 ||:   3%|2         | 3/111 [00:02<01:13,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7567, UAS: 0.9095, LAS: 0.8358, UEM: 0.3786, LEM: 0.1376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0075, partial_loss/deprel_loss: 1.6559, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7939, loss: 1.0705, batch_reg_loss: 0.0677, reg_loss: 0.0677 ||:   6%|6         | 7/111 [00:04<01:07,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9037, LAS: 0.8297, UEM: 0.4104, LEM: 0.1799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4051, partial_loss/deprel_loss: 0.6088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6359, loss: 1.1128, batch_reg_loss: 0.0678, reg_loss: 0.0677 ||:   9%|9         | 10/111 [00:06<01:06,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9057, LAS: 0.8309, UEM: 0.3985, LEM: 0.1653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1594, partial_loss/deprel_loss: 1.4341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4470, loss: 1.1057, batch_reg_loss: 0.0678, reg_loss: 0.0677 ||:  12%|#1        | 13/111 [00:08<01:07,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7768, UAS: 0.8954, LAS: 0.8210, UEM: 0.3798, LEM: 0.1587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8156, partial_loss/deprel_loss: 1.4734, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6097, loss: 1.1918, batch_reg_loss: 0.0679, reg_loss: 0.0678 ||:  14%|#4        | 16/111 [00:10<01:05,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9001, LAS: 0.8265, UEM: 0.3925, LEM: 0.1602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5088, partial_loss/deprel_loss: 0.6757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7103, loss: 1.1418, batch_reg_loss: 0.0680, reg_loss: 0.0678 ||:  18%|#8        | 20/111 [00:13<01:01,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9033, LAS: 0.8293, UEM: 0.4103, LEM: 0.1721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5729, partial_loss/deprel_loss: 0.8466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8599, loss: 1.1190, batch_reg_loss: 0.0680, reg_loss: 0.0678 ||:  21%|##        | 23/111 [00:15<00:59,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7607, UAS: 0.9003, LAS: 0.8257, UEM: 0.3788, LEM: 0.1528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9901, partial_loss/deprel_loss: 1.5372, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6959, loss: 1.1511, batch_reg_loss: 0.0681, reg_loss: 0.0679 ||:  25%|##5       | 28/111 [00:17<00:50,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8466, UAS: 0.9034, LAS: 0.8289, UEM: 0.3855, LEM: 0.1509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7388, partial_loss/deprel_loss: 1.0446, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0516, loss: 1.1226, batch_reg_loss: 0.0682, reg_loss: 0.0679 ||:  29%|##8       | 32/111 [00:20<00:51,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9063, LAS: 0.8325, UEM: 0.4192, LEM: 0.1846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3700, partial_loss/deprel_loss: 0.6140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6335, loss: 1.0953, batch_reg_loss: 0.0683, reg_loss: 0.0679 ||:  32%|###2      | 36/111 [00:23<00:52,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9079, LAS: 0.8343, UEM: 0.4254, LEM: 0.1857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4378, partial_loss/deprel_loss: 0.7192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7312, loss: 1.0799, batch_reg_loss: 0.0683, reg_loss: 0.0680 ||:  35%|###5      | 39/111 [00:25<00:50,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9090, LAS: 0.8357, UEM: 0.4734, LEM: 0.2418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5374, partial_loss/deprel_loss: 0.8689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8710, loss: 1.0719, batch_reg_loss: 0.0684, reg_loss: 0.0680 ||:  38%|###7      | 42/111 [00:28<00:52,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9110, LAS: 0.8381, UEM: 0.4946, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5987, partial_loss/deprel_loss: 0.8453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8644, loss: 1.0472, batch_reg_loss: 0.0684, reg_loss: 0.0680 ||:  41%|####      | 45/111 [00:31<00:51,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8491, UAS: 0.9084, LAS: 0.8351, UEM: 0.4845, LEM: 0.2480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6995, partial_loss/deprel_loss: 0.8959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9251, loss: 1.0728, batch_reg_loss: 0.0685, reg_loss: 0.0680 ||:  43%|####3     | 48/111 [00:33<00:48,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8088, UAS: 0.9075, LAS: 0.8338, UEM: 0.4736, LEM: 0.2393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1152, partial_loss/deprel_loss: 1.1692, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2269, loss: 1.0826, batch_reg_loss: 0.0685, reg_loss: 0.0681 ||:  46%|####5     | 51/111 [00:35<00:44,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7492, UAS: 0.9047, LAS: 0.8305, UEM: 0.4617, LEM: 0.2330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8205, partial_loss/deprel_loss: 1.8595, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9202, loss: 1.1140, batch_reg_loss: 0.0686, reg_loss: 0.0681 ||:  49%|####8     | 54/111 [00:37<00:41,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7964, UAS: 0.9034, LAS: 0.8291, UEM: 0.4487, LEM: 0.2257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2039, partial_loss/deprel_loss: 1.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3791, loss: 1.1273, batch_reg_loss: 0.0686, reg_loss: 0.0681 ||:  51%|#####1    | 57/111 [00:39<00:39,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7435, UAS: 0.9016, LAS: 0.8268, UEM: 0.4383, LEM: 0.2176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2836, partial_loss/deprel_loss: 1.8352, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9936, loss: 1.1479, batch_reg_loss: 0.0687, reg_loss: 0.0682 ||:  55%|#####4    | 61/111 [00:42<00:34,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8348, UAS: 0.9023, LAS: 0.8278, UEM: 0.4403, LEM: 0.2168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7759, partial_loss/deprel_loss: 1.0006, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0244, loss: 1.1379, batch_reg_loss: 0.0688, reg_loss: 0.0682 ||:  58%|#####7    | 64/111 [00:44<00:32,  1.44it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.9030, LAS: 0.8286, UEM: 0.4388, LEM: 0.2130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5197, partial_loss/deprel_loss: 0.7770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7944, loss: 1.1308, batch_reg_loss: 0.0689, reg_loss: 0.0682 ||:  60%|######    | 67/111 [00:46<00:30,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9032, LAS: 0.8287, UEM: 0.4419, LEM: 0.2154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3263, partial_loss/deprel_loss: 0.6052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6184, loss: 1.1277, batch_reg_loss: 0.0689, reg_loss: 0.0683 ||:  63%|######3   | 70/111 [00:48<00:29,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8555, UAS: 0.9024, LAS: 0.8277, UEM: 0.4353, LEM: 0.2113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6941, partial_loss/deprel_loss: 0.8625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8978, loss: 1.1377, batch_reg_loss: 0.0690, reg_loss: 0.0683 ||:  66%|######5   | 73/111 [00:50<00:26,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7257, UAS: 0.9023, LAS: 0.8276, UEM: 0.4461, LEM: 0.2181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5688, partial_loss/deprel_loss: 1.8292, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0462, loss: 1.1387, batch_reg_loss: 0.0691, reg_loss: 0.0683 ||:  68%|######8   | 76/111 [00:52<00:24,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8725, UAS: 0.9029, LAS: 0.8282, UEM: 0.4496, LEM: 0.2185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4104, partial_loss/deprel_loss: 0.7276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7332, loss: 1.1344, batch_reg_loss: 0.0691, reg_loss: 0.0683 ||:  71%|#######1  | 79/111 [00:55<00:22,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7970, UAS: 0.9011, LAS: 0.8263, UEM: 0.4404, LEM: 0.2131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4546, partial_loss/deprel_loss: 1.2680, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3746, loss: 1.1528, batch_reg_loss: 0.0692, reg_loss: 0.0684 ||:  75%|#######4  | 83/111 [00:57<00:19,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7372, UAS: 0.9006, LAS: 0.8256, UEM: 0.4416, LEM: 0.2148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9790, partial_loss/deprel_loss: 1.8560, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9498, loss: 1.1586, batch_reg_loss: 0.0693, reg_loss: 0.0684 ||:  77%|#######7  | 86/111 [00:59<00:17,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.9005, LAS: 0.8255, UEM: 0.4447, LEM: 0.2144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4351, partial_loss/deprel_loss: 0.7105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7247, loss: 1.1604, batch_reg_loss: 0.0694, reg_loss: 0.0685 ||:  81%|########1 | 90/111 [01:02<00:14,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9016, LAS: 0.8266, UEM: 0.4473, LEM: 0.2139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4284, partial_loss/deprel_loss: 0.6718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6926, loss: 1.1503, batch_reg_loss: 0.0694, reg_loss: 0.0685 ||:  84%|########3 | 93/111 [01:04<00:12,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8070, UAS: 0.9025, LAS: 0.8278, UEM: 0.4611, LEM: 0.2269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3530, partial_loss/deprel_loss: 1.2532, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3427, loss: 1.1401, batch_reg_loss: 0.0695, reg_loss: 0.0685 ||:  86%|########6 | 96/111 [01:06<00:10,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9011, LAS: 0.8262, UEM: 0.4614, LEM: 0.2285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3227, partial_loss/deprel_loss: 0.5647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5858, loss: 1.1574, batch_reg_loss: 0.0696, reg_loss: 0.0686 ||:  90%|######### | 100/111 [01:08<00:07,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7670, UAS: 0.9000, LAS: 0.8250, UEM: 0.4556, LEM: 0.2241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6908, partial_loss/deprel_loss: 1.5468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6452, loss: 1.1669, batch_reg_loss: 0.0696, reg_loss: 0.0686 ||:  94%|#########3| 104/111 [01:11<00:04,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.8997, LAS: 0.8246, UEM: 0.4485, LEM: 0.2188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9835, partial_loss/deprel_loss: 1.0113, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0754, loss: 1.1688, batch_reg_loss: 0.0697, reg_loss: 0.0686 ||:  97%|#########7| 108/111 [01:13<00:01,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.8993, LAS: 0.8241, UEM: 0.4477, LEM: 0.2181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3591, partial_loss/deprel_loss: 0.6441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6569, loss: 1.1728, batch_reg_loss: 0.0698, reg_loss: 0.0687 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-06 23:04:21,844 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9091, LAS: 0.8425, UEM: 0.5537, LEM: 0.2550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4429, partial_loss/deprel_loss: 25.5584, partial_loss/cycle_loss: 0.0000, batch_loss: 20.5353, loss: 33.4054, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:12,  1.17s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9252, LAS: 0.8642, UEM: 0.6450, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2464, partial_loss/deprel_loss: 19.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 15.9139, loss: 26.8195, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:05<00:08,  1.10s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8695, UAS: 0.9317, LAS: 0.8693, UEM: 0.6302, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5259, partial_loss/deprel_loss: 23.7138, partial_loss/cycle_loss: 0.0000, batch_loss: 19.0762, loss: 25.0754, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:08<00:05,  1.06s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8426, UAS: 0.9354, LAS: 0.8720, UEM: 0.6148, LEM: 0.3476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0366, partial_loss/deprel_loss: 42.6409, partial_loss/cycle_loss: 0.0000, batch_loss: 34.3200, loss: 24.3461, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:02,  1.01s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9327, LAS: 0.8688, UEM: 0.5809, LEM: 0.3203, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1886, partial_loss/deprel_loss: 48.1446, partial_loss/cycle_loss: 0.0000, batch_loss: 38.7534, loss: 25.3898, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
      "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:04:34,521 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.644  |    48.145\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.359  |     1.189\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.069  |     0.000\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - UEM                      |     0.448  |     0.581\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - LAS                      |     0.824  |     0.869\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - loss                     |     1.173  |    25.390\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - LEM                      |     0.218  |     0.320\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - UAS                      |     0.899  |     0.933\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - EM                       |     0.879  |     0.844\n",
      "2023-04-06 23:04:34,522 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:04:34,523 - INFO - combo.training.trainer - Epoch duration: 0:01:28.011201\n",
      "2023-04-06 23:04:34,523 - INFO - combo.training.trainer - Estimated training time remaining: 8:42:55\n",
      "2023-04-06 23:04:34,523 - INFO - allennlp.training.trainer - Epoch 11/399\n",
      "2023-04-06 23:04:34,523 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:04:34,523 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:04:34,529 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7318, UAS: 0.9023, LAS: 0.8266, UEM: 0.6184, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2381, partial_loss/deprel_loss: 1.8576, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0035, loss: 1.1306, batch_reg_loss: 0.0699, reg_loss: 0.0698 ||:   3%|2         | 3/111 [00:02<01:23,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8728, UAS: 0.9063, LAS: 0.8290, UEM: 0.4976, LEM: 0.2240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4630, partial_loss/deprel_loss: 0.8076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8086, loss: 1.1307, batch_reg_loss: 0.0699, reg_loss: 0.0699 ||:   5%|5         | 6/111 [00:04<01:18,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9103, LAS: 0.8362, UEM: 0.4687, LEM: 0.1954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1053, partial_loss/deprel_loss: 1.2357, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2797, loss: 1.0641, batch_reg_loss: 0.0700, reg_loss: 0.0699 ||:   9%|9         | 10/111 [00:06<01:12,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7896, UAS: 0.9057, LAS: 0.8323, UEM: 0.4223, LEM: 0.1711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5511, partial_loss/deprel_loss: 1.3968, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4978, loss: 1.0987, batch_reg_loss: 0.0701, reg_loss: 0.0700 ||:  12%|#1        | 13/111 [00:08<01:09,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7038, UAS: 0.8933, LAS: 0.8198, UEM: 0.4015, LEM: 0.1612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.3903, partial_loss/deprel_loss: 2.1584, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4749, loss: 1.2235, batch_reg_loss: 0.0702, reg_loss: 0.0700 ||:  15%|#5        | 17/111 [00:11<01:05,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.8926, LAS: 0.8186, UEM: 0.3850, LEM: 0.1549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5808, partial_loss/deprel_loss: 0.8367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8557, loss: 1.2307, batch_reg_loss: 0.0702, reg_loss: 0.0700 ||:  18%|#8        | 20/111 [00:13<01:04,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.8979, LAS: 0.8248, UEM: 0.4068, LEM: 0.1651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4397, partial_loss/deprel_loss: 0.6836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7051, loss: 1.1735, batch_reg_loss: 0.0703, reg_loss: 0.0701 ||:  21%|##        | 23/111 [00:16<01:02,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8470, UAS: 0.9013, LAS: 0.8287, UEM: 0.4106, LEM: 0.1665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6933, partial_loss/deprel_loss: 0.9933, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0037, loss: 1.1421, batch_reg_loss: 0.0704, reg_loss: 0.0701 ||:  24%|##4       | 27/111 [00:18<00:56,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9032, LAS: 0.8303, UEM: 0.4190, LEM: 0.1744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3419, partial_loss/deprel_loss: 0.5709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5955, loss: 1.1172, batch_reg_loss: 0.0705, reg_loss: 0.0701 ||:  28%|##7       | 31/111 [00:21<00:54,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9035, LAS: 0.8302, UEM: 0.4089, LEM: 0.1680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6362, partial_loss/deprel_loss: 0.7944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8333, loss: 1.1133, batch_reg_loss: 0.0705, reg_loss: 0.0702 ||:  31%|###       | 34/111 [00:23<00:52,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9044, LAS: 0.8316, UEM: 0.4279, LEM: 0.1793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3551, partial_loss/deprel_loss: 0.6374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6515, loss: 1.1019, batch_reg_loss: 0.0706, reg_loss: 0.0702 ||:  34%|###4      | 38/111 [00:25<00:47,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8177, UAS: 0.9025, LAS: 0.8289, UEM: 0.4126, LEM: 0.1706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0452, partial_loss/deprel_loss: 1.1970, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2373, loss: 1.1266, batch_reg_loss: 0.0707, reg_loss: 0.0703 ||:  38%|###7      | 42/111 [00:28<00:44,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8176, UAS: 0.9022, LAS: 0.8284, UEM: 0.3981, LEM: 0.1621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1751, partial_loss/deprel_loss: 1.1391, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2171, loss: 1.1310, batch_reg_loss: 0.0708, reg_loss: 0.0703 ||:  41%|####1     | 46/111 [00:30<00:40,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9036, LAS: 0.8304, UEM: 0.4308, LEM: 0.1934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6100, partial_loss/deprel_loss: 0.8959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9096, loss: 1.1156, batch_reg_loss: 0.0709, reg_loss: 0.0703 ||:  45%|####5     | 50/111 [00:33<00:40,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7861, UAS: 0.8996, LAS: 0.8257, UEM: 0.4162, LEM: 0.1863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4086, partial_loss/deprel_loss: 1.4620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5223, loss: 1.1565, batch_reg_loss: 0.0709, reg_loss: 0.0704 ||:  49%|####8     | 54/111 [00:36<00:38,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8806, UAS: 0.9003, LAS: 0.8264, UEM: 0.4200, LEM: 0.1901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4031, partial_loss/deprel_loss: 0.6066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6369, loss: 1.1513, batch_reg_loss: 0.0710, reg_loss: 0.0704 ||:  51%|#####1    | 57/111 [00:39<00:40,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8030, UAS: 0.8989, LAS: 0.8248, UEM: 0.4080, LEM: 0.1835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4330, partial_loss/deprel_loss: 1.2713, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3747, loss: 1.1698, batch_reg_loss: 0.0711, reg_loss: 0.0705 ||:  55%|#####4    | 61/111 [00:41<00:35,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.8991, LAS: 0.8250, UEM: 0.4074, LEM: 0.1823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3995, partial_loss/deprel_loss: 0.6930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7055, loss: 1.1708, batch_reg_loss: 0.0712, reg_loss: 0.0705 ||:  58%|#####7    | 64/111 [00:43<00:32,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9010, LAS: 0.8273, UEM: 0.4541, LEM: 0.2326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2275, partial_loss/deprel_loss: 0.4708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4934, loss: 1.1522, batch_reg_loss: 0.0713, reg_loss: 0.0705 ||:  60%|######    | 67/111 [00:46<00:33,  1.30it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9019, LAS: 0.8284, UEM: 0.4523, LEM: 0.2285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5616, partial_loss/deprel_loss: 0.7684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7984, loss: 1.1425, batch_reg_loss: 0.0713, reg_loss: 0.0706 ||:  63%|######3   | 70/111 [00:48<00:30,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8597, UAS: 0.9028, LAS: 0.8292, UEM: 0.4489, LEM: 0.2223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5849, partial_loss/deprel_loss: 0.8075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8344, loss: 1.1331, batch_reg_loss: 0.0714, reg_loss: 0.0706 ||:  67%|######6   | 74/111 [00:51<00:27,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8455, UAS: 0.9026, LAS: 0.8289, UEM: 0.4483, LEM: 0.2209, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7892, partial_loss/deprel_loss: 0.9486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9882, loss: 1.1360, batch_reg_loss: 0.0715, reg_loss: 0.0706 ||:  69%|######9   | 77/111 [00:53<00:24,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7855, UAS: 0.9023, LAS: 0.8285, UEM: 0.4494, LEM: 0.2224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5825, partial_loss/deprel_loss: 1.4556, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5525, loss: 1.1386, batch_reg_loss: 0.0716, reg_loss: 0.0707 ||:  72%|#######2  | 80/111 [00:55<00:21,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7285, UAS: 0.9020, LAS: 0.8283, UEM: 0.4558, LEM: 0.2254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6126, partial_loss/deprel_loss: 1.8106, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0426, loss: 1.1390, batch_reg_loss: 0.0716, reg_loss: 0.0707 ||:  75%|#######4  | 83/111 [00:57<00:21,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9022, LAS: 0.8285, UEM: 0.4532, LEM: 0.2213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4983, partial_loss/deprel_loss: 0.8175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8254, loss: 1.1382, batch_reg_loss: 0.0717, reg_loss: 0.0707 ||:  78%|#######8  | 87/111 [01:00<00:17,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9024, LAS: 0.8289, UEM: 0.4612, LEM: 0.2287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4406, partial_loss/deprel_loss: 0.6748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6998, loss: 1.1361, batch_reg_loss: 0.0718, reg_loss: 0.0708 ||:  82%|########1 | 91/111 [01:03<00:14,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7991, UAS: 0.9021, LAS: 0.8285, UEM: 0.4575, LEM: 0.2255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4676, partial_loss/deprel_loss: 1.4466, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5226, loss: 1.1405, batch_reg_loss: 0.0719, reg_loss: 0.0708 ||:  86%|########5 | 95/111 [01:05<00:10,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7878, UAS: 0.9016, LAS: 0.8278, UEM: 0.4487, LEM: 0.2202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5254, partial_loss/deprel_loss: 1.4661, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5499, loss: 1.1483, batch_reg_loss: 0.0720, reg_loss: 0.0709 ||:  89%|########9 | 99/111 [01:08<00:08,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8066, UAS: 0.9015, LAS: 0.8276, UEM: 0.4439, LEM: 0.2164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1248, partial_loss/deprel_loss: 1.2021, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2587, loss: 1.1491, batch_reg_loss: 0.0720, reg_loss: 0.0709 ||:  93%|#########2| 103/111 [01:10<00:05,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8412, UAS: 0.9024, LAS: 0.8286, UEM: 0.4471, LEM: 0.2176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7510, partial_loss/deprel_loss: 0.9877, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0125, loss: 1.1405, batch_reg_loss: 0.0721, reg_loss: 0.0710 ||:  96%|#########6| 107/111 [01:12<00:02,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7498, UAS: 0.9025, LAS: 0.8286, UEM: 0.4506, LEM: 0.2200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1198, partial_loss/deprel_loss: 1.8436, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9710, loss: 1.1415, batch_reg_loss: 0.0722, reg_loss: 0.0710 ||: 100%|##########| 111/111 [01:15<00:00,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7498, UAS: 0.9025, LAS: 0.8286, UEM: 0.4506, LEM: 0.2200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1198, partial_loss/deprel_loss: 1.8436, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9710, loss: 1.1415, batch_reg_loss: 0.0722, reg_loss: 0.0710 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.844  |       N/A\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     2.120  |       N/A\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.071  |       N/A\n",
      "2023-04-06 23:05:50,104 - INFO - combo.training.tensorboard_writer - UEM                      |     0.451  |       N/A\n",
      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - LAS                      |     0.829  |       N/A\n",
      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - loss                     |     1.141  |       N/A\n",
      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - LEM                      |     0.220  |       N/A\n",
      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - UAS                      |     0.902  |       N/A\n",
      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - EM                       |     0.750  |       N/A\n",
      "2023-04-06 23:05:50,105 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:05:50,106 - INFO - combo.training.trainer - Epoch duration: 0:01:15.582589\n",
      "2023-04-06 23:05:50,106 - INFO - combo.training.trainer - Estimated training time remaining: 8:38:50\n",
      "2023-04-06 23:05:50,106 - INFO - allennlp.training.trainer - Epoch 12/399\n",
      "2023-04-06 23:05:50,106 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:05:50,106 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:05:50,112 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9145, LAS: 0.8453, UEM: 0.4518, LEM: 0.2105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4663, partial_loss/deprel_loss: 0.7585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7723, loss: 1.0488, batch_reg_loss: 0.0723, reg_loss: 0.0723 ||:   3%|2         | 3/111 [00:02<01:15,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9059, LAS: 0.8377, UEM: 0.5846, LEM: 0.3476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6475, partial_loss/deprel_loss: 0.8195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8574, loss: 1.0996, batch_reg_loss: 0.0723, reg_loss: 0.0723 ||:   5%|5         | 6/111 [00:04<01:15,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9139, LAS: 0.8456, UEM: 0.5705, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4356, partial_loss/deprel_loss: 0.6474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6774, loss: 1.0076, batch_reg_loss: 0.0724, reg_loss: 0.0723 ||:   8%|8         | 9/111 [00:06<01:13,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9174, LAS: 0.8482, UEM: 0.5739, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3122, partial_loss/deprel_loss: 0.6180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6293, loss: 0.9715, batch_reg_loss: 0.0725, reg_loss: 0.0723 ||:  11%|#         | 12/111 [00:08<01:13,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8221, UAS: 0.9104, LAS: 0.8398, UEM: 0.5355, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0309, partial_loss/deprel_loss: 1.0752, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1389, loss: 1.0415, batch_reg_loss: 0.0725, reg_loss: 0.0724 ||:  14%|#3        | 15/111 [00:11<01:11,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8429, UAS: 0.9067, LAS: 0.8371, UEM: 0.5688, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8351, partial_loss/deprel_loss: 0.9804, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0239, loss: 1.0859, batch_reg_loss: 0.0726, reg_loss: 0.0724 ||:  16%|#6        | 18/111 [00:13<01:10,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9099, LAS: 0.8394, UEM: 0.5595, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5296, partial_loss/deprel_loss: 0.7868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8080, loss: 1.0573, batch_reg_loss: 0.0726, reg_loss: 0.0724 ||:  19%|#8        | 21/111 [00:15<01:05,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8695, UAS: 0.9070, LAS: 0.8361, UEM: 0.5278, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5860, partial_loss/deprel_loss: 0.8350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8579, loss: 1.0872, batch_reg_loss: 0.0727, reg_loss: 0.0725 ||:  23%|##2       | 25/111 [00:17<00:59,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9108, LAS: 0.8402, UEM: 0.5494, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7324, partial_loss/deprel_loss: 0.9558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9839, loss: 1.0478, batch_reg_loss: 0.0728, reg_loss: 0.0725 ||:  25%|##5       | 28/111 [00:20<00:58,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8217, UAS: 0.9095, LAS: 0.8378, UEM: 0.5353, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9042, partial_loss/deprel_loss: 1.1620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1834, loss: 1.0668, batch_reg_loss: 0.0729, reg_loss: 0.0726 ||:  29%|##8       | 32/111 [00:22<00:53,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8655, UAS: 0.9101, LAS: 0.8382, UEM: 0.5166, LEM: 0.2622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5087, partial_loss/deprel_loss: 0.8009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8154, loss: 1.0627, batch_reg_loss: 0.0730, reg_loss: 0.0726 ||:  32%|###2      | 36/111 [00:25<00:49,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8028, UAS: 0.9089, LAS: 0.8370, UEM: 0.5070, LEM: 0.2578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3822, partial_loss/deprel_loss: 1.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4248, loss: 1.0717, batch_reg_loss: 0.0731, reg_loss: 0.0726 ||:  36%|###6      | 40/111 [00:27<00:46,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9101, LAS: 0.8384, UEM: 0.5297, LEM: 0.2952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0845, partial_loss/deprel_loss: 0.2260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2709, loss: 1.0596, batch_reg_loss: 0.0731, reg_loss: 0.0727 ||:  40%|###9      | 44/111 [00:30<00:47,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9088, LAS: 0.8368, UEM: 0.5236, LEM: 0.2921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3538, partial_loss/deprel_loss: 0.5469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5815, loss: 1.0727, batch_reg_loss: 0.0732, reg_loss: 0.0727 ||:  43%|####3     | 48/111 [00:33<00:44,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8150, UAS: 0.9072, LAS: 0.8350, UEM: 0.5092, LEM: 0.2833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0867, partial_loss/deprel_loss: 1.3690, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3859, loss: 1.0896, batch_reg_loss: 0.0733, reg_loss: 0.0728 ||:  46%|####5     | 51/111 [00:36<00:43,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.9088, LAS: 0.8370, UEM: 0.5143, LEM: 0.2817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8776, partial_loss/deprel_loss: 1.0180, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0633, loss: 1.0735, batch_reg_loss: 0.0734, reg_loss: 0.0728 ||:  49%|####8     | 54/111 [00:38<00:43,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7273, UAS: 0.9077, LAS: 0.8359, UEM: 0.5105, LEM: 0.2755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6504, partial_loss/deprel_loss: 1.8004, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0438, loss: 1.0829, batch_reg_loss: 0.0734, reg_loss: 0.0728 ||:  51%|#####1    | 57/111 [00:40<00:39,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7544, UAS: 0.9065, LAS: 0.8341, UEM: 0.4990, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8573, partial_loss/deprel_loss: 1.7411, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8378, loss: 1.0979, batch_reg_loss: 0.0735, reg_loss: 0.0729 ||:  54%|#####4    | 60/111 [00:42<00:37,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7376, UAS: 0.9049, LAS: 0.8321, UEM: 0.4968, LEM: 0.2647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1506, partial_loss/deprel_loss: 1.7339, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8908, loss: 1.1161, batch_reg_loss: 0.0736, reg_loss: 0.0729 ||:  57%|#####6    | 63/111 [00:45<00:35,  1.34it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7635, UAS: 0.9050, LAS: 0.8323, UEM: 0.4953, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9722, partial_loss/deprel_loss: 1.6385, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7789, loss: 1.1152, batch_reg_loss: 0.0737, reg_loss: 0.0729 ||:  60%|######    | 67/111 [00:47<00:31,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9055, LAS: 0.8327, UEM: 0.4957, LEM: 0.2607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.5606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5937, loss: 1.1123, batch_reg_loss: 0.0737, reg_loss: 0.0730 ||:  63%|######3   | 70/111 [00:50<00:29,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9058, LAS: 0.8332, UEM: 0.4880, LEM: 0.2547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6342, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8317, loss: 1.1077, batch_reg_loss: 0.0738, reg_loss: 0.0730 ||:  67%|######6   | 74/111 [00:52<00:26,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8511, UAS: 0.9068, LAS: 0.8343, UEM: 0.4830, LEM: 0.2481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7012, partial_loss/deprel_loss: 0.8971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9318, loss: 1.0977, batch_reg_loss: 0.0739, reg_loss: 0.0731 ||:  70%|#######   | 78/111 [00:54<00:21,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9070, LAS: 0.8342, UEM: 0.4768, LEM: 0.2413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7163, partial_loss/deprel_loss: 0.9517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9786, loss: 1.0981, batch_reg_loss: 0.0740, reg_loss: 0.0731 ||:  74%|#######3  | 82/111 [00:57<00:19,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7462, UAS: 0.9056, LAS: 0.8328, UEM: 0.4687, LEM: 0.2366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1859, partial_loss/deprel_loss: 1.6293, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8147, loss: 1.1102, batch_reg_loss: 0.0741, reg_loss: 0.0731 ||:  77%|#######7  | 86/111 [00:59<00:15,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8527, UAS: 0.9051, LAS: 0.8322, UEM: 0.4610, LEM: 0.2306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6899, partial_loss/deprel_loss: 0.8140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8633, loss: 1.1154, batch_reg_loss: 0.0742, reg_loss: 0.0732 ||:  81%|########1 | 90/111 [01:02<00:13,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9056, LAS: 0.8328, UEM: 0.4617, LEM: 0.2292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3437, partial_loss/deprel_loss: 0.5813, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6080, loss: 1.1113, batch_reg_loss: 0.0743, reg_loss: 0.0732 ||:  85%|########4 | 94/111 [01:04<00:10,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8285, UAS: 0.9058, LAS: 0.8330, UEM: 0.4594, LEM: 0.2272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8808, partial_loss/deprel_loss: 1.0929, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1248, loss: 1.1101, batch_reg_loss: 0.0743, reg_loss: 0.0733 ||:  88%|########8 | 98/111 [01:07<00:08,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9059, LAS: 0.8333, UEM: 0.4644, LEM: 0.2317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5260, partial_loss/deprel_loss: 0.6404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6920, loss: 1.1069, batch_reg_loss: 0.0744, reg_loss: 0.0733 ||:  92%|#########1| 102/111 [01:09<00:05,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9051, LAS: 0.8326, UEM: 0.4572, LEM: 0.2272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7691, partial_loss/deprel_loss: 0.9381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9788, loss: 1.1119, batch_reg_loss: 0.0745, reg_loss: 0.0734 ||:  95%|#########5| 106/111 [01:12<00:03,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8197, UAS: 0.9062, LAS: 0.8339, UEM: 0.4675, LEM: 0.2349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0885, partial_loss/deprel_loss: 1.1797, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2361, loss: 1.0998, batch_reg_loss: 0.0746, reg_loss: 0.0734 ||:  99%|#########9| 110/111 [01:15<00:00,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8198, UAS: 0.9061, LAS: 0.8338, UEM: 0.4655, LEM: 0.2335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0232, partial_loss/deprel_loss: 1.1102, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1674, loss: 1.1004, batch_reg_loss: 0.0746, reg_loss: 0.0734 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-06 23:07:05,881 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.110  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.023  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.073  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - UEM                      |     0.465  |       N/A\n",
      "2023-04-06 23:07:05,882 - INFO - combo.training.tensorboard_writer - LAS                      |     0.834  |       N/A\n",
      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - loss                     |     1.100  |       N/A\n",
      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - LEM                      |     0.233  |       N/A\n",
      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - UAS                      |     0.906  |       N/A\n",
      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - EM                       |     0.820  |       N/A\n",
      "2023-04-06 23:07:05,883 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:07:05,884 - INFO - combo.training.trainer - Epoch duration: 0:01:15.777801\n",
      "2023-04-06 23:07:05,884 - INFO - combo.training.trainer - Estimated training time remaining: 8:35:17\n",
      "2023-04-06 23:07:05,884 - INFO - allennlp.training.trainer - Epoch 13/399\n",
      "2023-04-06 23:07:05,884 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:07:05,884 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:07:05,891 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9303, LAS: 0.8619, UEM: 0.4574, LEM: 0.1618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7100, partial_loss/deprel_loss: 0.9025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9387, loss: 0.8542, batch_reg_loss: 0.0747, reg_loss: 0.0747 ||:   4%|3         | 4/111 [00:02<01:05,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9274, LAS: 0.8577, UEM: 0.5495, LEM: 0.2515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5867, partial_loss/deprel_loss: 0.8378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8624, loss: 0.9059, batch_reg_loss: 0.0747, reg_loss: 0.0747 ||:   6%|6         | 7/111 [00:04<01:06,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8469, UAS: 0.9324, LAS: 0.8661, UEM: 0.6490, LEM: 0.3987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7952, partial_loss/deprel_loss: 0.9270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9754, loss: 0.8396, batch_reg_loss: 0.0748, reg_loss: 0.0747 ||:   9%|9         | 10/111 [00:07<01:10,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8533, UAS: 0.9237, LAS: 0.8552, UEM: 0.6107, LEM: 0.3598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5861, partial_loss/deprel_loss: 0.8717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8895, loss: 0.9147, batch_reg_loss: 0.0749, reg_loss: 0.0748 ||:  12%|#1        | 13/111 [00:09<01:09,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9197, LAS: 0.8506, UEM: 0.5745, LEM: 0.3269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3641, partial_loss/deprel_loss: 0.6230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6461, loss: 0.9695, batch_reg_loss: 0.0749, reg_loss: 0.0748 ||:  15%|#5        | 17/111 [00:11<01:03,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9151, LAS: 0.8442, UEM: 0.5264, LEM: 0.2925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1686, partial_loss/deprel_loss: 1.2195, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2844, loss: 1.0252, batch_reg_loss: 0.0750, reg_loss: 0.0748 ||:  19%|#8        | 21/111 [00:13<00:57,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8267, UAS: 0.9124, LAS: 0.8413, UEM: 0.4941, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0154, partial_loss/deprel_loss: 1.0660, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1310, loss: 1.0460, batch_reg_loss: 0.0751, reg_loss: 0.0749 ||:  23%|##2       | 25/111 [00:16<00:53,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8238, UAS: 0.9086, LAS: 0.8368, UEM: 0.4664, LEM: 0.2499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0240, partial_loss/deprel_loss: 1.2609, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2887, loss: 1.0848, batch_reg_loss: 0.0752, reg_loss: 0.0749 ||:  26%|##6       | 29/111 [00:18<00:49,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8801, UAS: 0.9055, LAS: 0.8337, UEM: 0.4621, LEM: 0.2417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.6399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6710, loss: 1.1165, batch_reg_loss: 0.0753, reg_loss: 0.0749 ||:  30%|##9       | 33/111 [00:21<00:49,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9073, LAS: 0.8363, UEM: 0.4795, LEM: 0.2514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6131, partial_loss/deprel_loss: 0.7515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7992, loss: 1.0915, batch_reg_loss: 0.0754, reg_loss: 0.0750 ||:  33%|###3      | 37/111 [00:24<00:49,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7761, UAS: 0.9057, LAS: 0.8346, UEM: 0.4668, LEM: 0.2435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8575, partial_loss/deprel_loss: 1.3668, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5404, loss: 1.1023, batch_reg_loss: 0.0754, reg_loss: 0.0750 ||:  36%|###6      | 40/111 [00:26<00:49,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7881, UAS: 0.9043, LAS: 0.8329, UEM: 0.4531, LEM: 0.2340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5114, partial_loss/deprel_loss: 1.4052, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5020, loss: 1.1203, batch_reg_loss: 0.0755, reg_loss: 0.0751 ||:  40%|###9      | 44/111 [00:29<00:45,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9052, LAS: 0.8341, UEM: 0.4580, LEM: 0.2377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9760, partial_loss/deprel_loss: 0.9807, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0554, loss: 1.1106, batch_reg_loss: 0.0756, reg_loss: 0.0751 ||:  43%|####3     | 48/111 [00:31<00:41,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9044, LAS: 0.8330, UEM: 0.4435, LEM: 0.2266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8102, partial_loss/deprel_loss: 0.9511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9986, loss: 1.1189, batch_reg_loss: 0.0757, reg_loss: 0.0752 ||:  47%|####6     | 52/111 [00:34<00:38,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8000, UAS: 0.9029, LAS: 0.8312, UEM: 0.4362, LEM: 0.2202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5169, partial_loss/deprel_loss: 1.3667, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4725, loss: 1.1357, batch_reg_loss: 0.0758, reg_loss: 0.0752 ||:  50%|#####     | 56/111 [00:36<00:36,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7002, UAS: 0.9022, LAS: 0.8304, UEM: 0.4436, LEM: 0.2236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2238, partial_loss/deprel_loss: 2.1219, partial_loss/cycle_loss: 0.0000, batch_loss: 2.4182, loss: 1.1438, batch_reg_loss: 0.0759, reg_loss: 0.0752 ||:  54%|#####4    | 60/111 [00:39<00:33,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9040, LAS: 0.8323, UEM: 0.4516, LEM: 0.2267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6981, partial_loss/deprel_loss: 0.9456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9721, loss: 1.1264, batch_reg_loss: 0.0760, reg_loss: 0.0753 ||:  58%|#####7    | 64/111 [00:41<00:30,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9055, LAS: 0.8341, UEM: 0.4556, LEM: 0.2268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4415, partial_loss/deprel_loss: 0.7414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 1.1101, batch_reg_loss: 0.0761, reg_loss: 0.0753 ||:  61%|######1   | 68/111 [00:44<00:28,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9040, LAS: 0.8328, UEM: 0.4447, LEM: 0.2207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7093, partial_loss/deprel_loss: 0.7485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8168, loss: 1.1185, batch_reg_loss: 0.0762, reg_loss: 0.0754 ||:  65%|######4   | 72/111 [00:47<00:25,  1.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8172, UAS: 0.9043, LAS: 0.8333, UEM: 0.4447, LEM: 0.2198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2306, partial_loss/deprel_loss: 1.1250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2224, loss: 1.1130, batch_reg_loss: 0.0763, reg_loss: 0.0754 ||:  68%|######8   | 76/111 [00:50<00:24,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9062, LAS: 0.8355, UEM: 0.4584, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2390, partial_loss/deprel_loss: 0.4781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5066, loss: 1.0937, batch_reg_loss: 0.0764, reg_loss: 0.0755 ||:  72%|#######2  | 80/111 [00:53<00:21,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8032, UAS: 0.9060, LAS: 0.8351, UEM: 0.4538, LEM: 0.2249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3960, partial_loss/deprel_loss: 1.3687, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4506, loss: 1.0980, batch_reg_loss: 0.0764, reg_loss: 0.0755 ||:  75%|#######4  | 83/111 [00:55<00:19,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8021, UAS: 0.9050, LAS: 0.8337, UEM: 0.4466, LEM: 0.2208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3930, partial_loss/deprel_loss: 1.3680, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4495, loss: 1.1114, batch_reg_loss: 0.0765, reg_loss: 0.0755 ||:  77%|#######7  | 86/111 [00:57<00:17,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9049, LAS: 0.8336, UEM: 0.4501, LEM: 0.2231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3639, partial_loss/deprel_loss: 0.5709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6060, loss: 1.1125, batch_reg_loss: 0.0765, reg_loss: 0.0756 ||:  80%|########  | 89/111 [00:59<00:15,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9055, LAS: 0.8343, UEM: 0.4625, LEM: 0.2369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4388, partial_loss/deprel_loss: 0.6558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6890, loss: 1.1064, batch_reg_loss: 0.0766, reg_loss: 0.0756 ||:  84%|########3 | 93/111 [01:02<00:12,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8150, UAS: 0.9057, LAS: 0.8346, UEM: 0.4606, LEM: 0.2346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0815, partial_loss/deprel_loss: 1.1541, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2163, loss: 1.1032, batch_reg_loss: 0.0767, reg_loss: 0.0757 ||:  87%|########7 | 97/111 [01:04<00:09,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9064, LAS: 0.8353, UEM: 0.4631, LEM: 0.2353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5644, partial_loss/deprel_loss: 0.7545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7933, loss: 1.0944, batch_reg_loss: 0.0768, reg_loss: 0.0757 ||:  90%|######### | 100/111 [01:07<00:07,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9071, LAS: 0.8359, UEM: 0.4619, LEM: 0.2309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4491, partial_loss/deprel_loss: 0.7446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7624, loss: 1.0887, batch_reg_loss: 0.0769, reg_loss: 0.0757 ||:  94%|#########3| 104/111 [01:09<00:04,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8485, UAS: 0.9075, LAS: 0.8365, UEM: 0.4599, LEM: 0.2282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7765, partial_loss/deprel_loss: 0.9821, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0180, loss: 1.0846, batch_reg_loss: 0.0770, reg_loss: 0.0758 ||:  97%|#########7| 108/111 [01:12<00:01,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9079, LAS: 0.8370, UEM: 0.4689, LEM: 0.2362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5006, partial_loss/deprel_loss: 0.6604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7055, loss: 1.0791, batch_reg_loss: 0.0770, reg_loss: 0.0758 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
      "2023-04-06 23:08:20,319 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:08:20,319 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.660  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.501  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.076  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - UEM                      |     0.469  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - LAS                      |     0.837  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - loss                     |     1.079  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - LEM                      |     0.236  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:08:20,320 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - UAS                      |     0.908  |       N/A\n",
      "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - EM                       |     0.877  |       N/A\n",
      "2023-04-06 23:08:20,321 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:08:20,321 - INFO - combo.training.trainer - Epoch duration: 0:01:14.437484\n",
      "2023-04-06 23:08:20,322 - INFO - combo.training.trainer - Estimated training time remaining: 8:31:27\n",
      "2023-04-06 23:08:20,322 - INFO - allennlp.training.trainer - Epoch 14/399\n",
      "2023-04-06 23:08:20,322 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:08:20,322 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:08:20,328 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9050, LAS: 0.8322, UEM: 0.3462, LEM: 0.1412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.6340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6619, loss: 1.1053, batch_reg_loss: 0.0771, reg_loss: 0.0771 ||:   4%|3         | 4/111 [00:02<01:09,  1.53it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9041, UAS: 0.9247, LAS: 0.8550, UEM: 0.5441, LEM: 0.2661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2521, partial_loss/deprel_loss: 0.4683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5022, loss: 0.9122, batch_reg_loss: 0.0772, reg_loss: 0.0771 ||:   6%|6         | 7/111 [00:04<01:09,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9159, LAS: 0.8477, UEM: 0.6024, LEM: 0.3563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8878, partial_loss/deprel_loss: 0.9722, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0326, loss: 0.9816, batch_reg_loss: 0.0773, reg_loss: 0.0772 ||:   9%|9         | 10/111 [00:06<01:09,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8393, UAS: 0.9164, LAS: 0.8477, UEM: 0.5390, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8523, partial_loss/deprel_loss: 0.9885, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0386, loss: 0.9758, batch_reg_loss: 0.0773, reg_loss: 0.0772 ||:  13%|#2        | 14/111 [00:09<01:03,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7601, UAS: 0.9110, LAS: 0.8412, UEM: 0.5185, LEM: 0.2800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9668, partial_loss/deprel_loss: 1.5166, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6841, loss: 1.0342, batch_reg_loss: 0.0774, reg_loss: 0.0772 ||:  15%|#5        | 17/111 [00:11<01:04,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8805, UAS: 0.9141, LAS: 0.8444, UEM: 0.5072, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3938, partial_loss/deprel_loss: 0.6296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 1.0093, batch_reg_loss: 0.0775, reg_loss: 0.0773 ||:  19%|#8        | 21/111 [00:14<01:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8259, UAS: 0.9116, LAS: 0.8416, UEM: 0.4865, LEM: 0.2501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0877, partial_loss/deprel_loss: 1.1095, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1827, loss: 1.0410, batch_reg_loss: 0.0776, reg_loss: 0.0773 ||:  23%|##2       | 25/111 [00:16<00:57,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8550, UAS: 0.9061, LAS: 0.8356, UEM: 0.4625, LEM: 0.2324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7059, partial_loss/deprel_loss: 0.8587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9058, loss: 1.0970, batch_reg_loss: 0.0777, reg_loss: 0.0774 ||:  26%|##6       | 29/111 [00:19<00:52,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9051, LAS: 0.8340, UEM: 0.4469, LEM: 0.2211, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0395, partial_loss/deprel_loss: 1.0731, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1441, loss: 1.1120, batch_reg_loss: 0.0778, reg_loss: 0.0774 ||:  30%|##9       | 33/111 [00:21<00:50,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9085, LAS: 0.8382, UEM: 0.4764, LEM: 0.2406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3495, partial_loss/deprel_loss: 0.6205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6442, loss: 1.0744, batch_reg_loss: 0.0778, reg_loss: 0.0774 ||:  32%|###2      | 36/111 [00:24<00:52,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9108, LAS: 0.8411, UEM: 0.4902, LEM: 0.2499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6145, partial_loss/deprel_loss: 0.7804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8251, loss: 1.0500, batch_reg_loss: 0.0779, reg_loss: 0.0775 ||:  36%|###6      | 40/111 [00:26<00:48,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9124, LAS: 0.8426, UEM: 0.4984, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3140, partial_loss/deprel_loss: 0.5344, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5684, loss: 1.0315, batch_reg_loss: 0.0780, reg_loss: 0.0775 ||:  40%|###9      | 44/111 [00:29<00:45,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8373, UAS: 0.9119, LAS: 0.8419, UEM: 0.4840, LEM: 0.2437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9631, partial_loss/deprel_loss: 1.0249, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0907, loss: 1.0371, batch_reg_loss: 0.0781, reg_loss: 0.0776 ||:  42%|####2     | 47/111 [00:31<00:44,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9133, LAS: 0.8437, UEM: 0.4948, LEM: 0.2530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2245, partial_loss/deprel_loss: 0.4133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4537, loss: 1.0207, batch_reg_loss: 0.0782, reg_loss: 0.0776 ||:  46%|####5     | 51/111 [00:34<00:41,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7901, UAS: 0.9129, LAS: 0.8434, UEM: 0.4891, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6952, partial_loss/deprel_loss: 1.4274, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5592, loss: 1.0256, batch_reg_loss: 0.0782, reg_loss: 0.0776 ||:  49%|####8     | 54/111 [00:36<00:40,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9121, LAS: 0.8425, UEM: 0.4933, LEM: 0.2509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1891, partial_loss/deprel_loss: 0.4925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5101, loss: 1.0326, batch_reg_loss: 0.0783, reg_loss: 0.0777 ||:  52%|#####2    | 58/111 [00:39<00:37,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8539, UAS: 0.9113, LAS: 0.8415, UEM: 0.4846, LEM: 0.2433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6334, partial_loss/deprel_loss: 0.8711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9019, loss: 1.0366, batch_reg_loss: 0.0784, reg_loss: 0.0777 ||:  56%|#####5    | 62/111 [00:41<00:33,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9111, LAS: 0.8413, UEM: 0.4800, LEM: 0.2409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4166, partial_loss/deprel_loss: 0.6120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6514, loss: 1.0415, batch_reg_loss: 0.0785, reg_loss: 0.0778 ||:  59%|#####8    | 65/111 [00:44<00:31,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7980, UAS: 0.9108, LAS: 0.8410, UEM: 0.4735, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4804, partial_loss/deprel_loss: 1.3567, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4600, loss: 1.0455, batch_reg_loss: 0.0785, reg_loss: 0.0778 ||:  61%|######1   | 68/111 [00:46<00:30,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7880, UAS: 0.9112, LAS: 0.8414, UEM: 0.4779, LEM: 0.2394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6517, partial_loss/deprel_loss: 1.4157, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5415, loss: 1.0425, batch_reg_loss: 0.0786, reg_loss: 0.0778 ||:  64%|######3   | 71/111 [00:48<00:29,  1.38it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9119, LAS: 0.8426, UEM: 0.4984, LEM: 0.2679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1117, partial_loss/deprel_loss: 0.2414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2941, loss: 1.0349, batch_reg_loss: 0.0786, reg_loss: 0.0779 ||:  67%|######6   | 74/111 [00:50<00:27,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7983, UAS: 0.9113, LAS: 0.8419, UEM: 0.4900, LEM: 0.2614, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4769, partial_loss/deprel_loss: 1.3341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4414, loss: 1.0420, batch_reg_loss: 0.0787, reg_loss: 0.0779 ||:  70%|#######   | 78/111 [00:53<00:23,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7141, UAS: 0.9108, LAS: 0.8416, UEM: 0.4961, LEM: 0.2649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.2212, partial_loss/deprel_loss: 2.0886, partial_loss/cycle_loss: 0.0000, batch_loss: 2.3939, loss: 1.0457, batch_reg_loss: 0.0788, reg_loss: 0.0779 ||:  74%|#######3  | 82/111 [00:56<00:20,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8603, UAS: 0.9102, LAS: 0.8409, UEM: 0.4893, LEM: 0.2593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6706, partial_loss/deprel_loss: 0.8114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8622, loss: 1.0496, batch_reg_loss: 0.0789, reg_loss: 0.0780 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7963, UAS: 0.9103, LAS: 0.8411, UEM: 0.4857, LEM: 0.2558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4870, partial_loss/deprel_loss: 1.3774, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4783, loss: 1.0499, batch_reg_loss: 0.0790, reg_loss: 0.0780 ||:  81%|########1 | 90/111 [01:01<00:14,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8439, UAS: 0.9096, LAS: 0.8401, UEM: 0.4780, LEM: 0.2496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7491, partial_loss/deprel_loss: 0.8945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9445, loss: 1.0577, batch_reg_loss: 0.0791, reg_loss: 0.0781 ||:  85%|########4 | 94/111 [01:03<00:10,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9107, LAS: 0.8414, UEM: 0.4827, LEM: 0.2505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6406, partial_loss/deprel_loss: 0.8061, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8522, loss: 1.0448, batch_reg_loss: 0.0792, reg_loss: 0.0781 ||:  88%|########8 | 98/111 [01:06<00:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8037, UAS: 0.9103, LAS: 0.8410, UEM: 0.4798, LEM: 0.2484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2133, partial_loss/deprel_loss: 1.2041, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2852, loss: 1.0474, batch_reg_loss: 0.0792, reg_loss: 0.0781 ||:  91%|######### | 101/111 [01:08<00:07,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7601, UAS: 0.9088, LAS: 0.8395, UEM: 0.4738, LEM: 0.2452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0699, partial_loss/deprel_loss: 1.6046, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7770, loss: 1.0608, batch_reg_loss: 0.0793, reg_loss: 0.0782 ||:  94%|#########3| 104/111 [01:11<00:04,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8128, UAS: 0.9079, LAS: 0.8384, UEM: 0.4676, LEM: 0.2416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1866, partial_loss/deprel_loss: 1.2551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3208, loss: 1.0707, batch_reg_loss: 0.0794, reg_loss: 0.0782 ||:  96%|#########6| 107/111 [01:13<00:02,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9092, LAS: 0.8398, UEM: 0.4744, LEM: 0.2438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3939, partial_loss/deprel_loss: 0.6267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6596, loss: 1.0586, batch_reg_loss: 0.0795, reg_loss: 0.0783 ||: 100%|##########| 111/111 [01:15<00:00,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9092, LAS: 0.8398, UEM: 0.4744, LEM: 0.2438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3939, partial_loss/deprel_loss: 0.6267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6596, loss: 1.0586, batch_reg_loss: 0.0795, reg_loss: 0.0783 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.627  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.394  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.078  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - UEM                      |     0.474  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - LAS                      |     0.840  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - loss                     |     1.059  |       N/A\n",
      "2023-04-06 23:09:36,176 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - LEM                      |     0.244  |       N/A\n",
      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - UAS                      |     0.909  |       N/A\n",
      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - EM                       |     0.879  |       N/A\n",
      "2023-04-06 23:09:36,177 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:09:36,177 - INFO - combo.training.trainer - Epoch duration: 0:01:15.855623\n",
      "2023-04-06 23:09:36,177 - INFO - combo.training.trainer - Estimated training time remaining: 8:28:34\n",
      "2023-04-06 23:09:36,178 - INFO - allennlp.training.trainer - Epoch 15/399\n",
      "2023-04-06 23:09:36,178 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:09:36,178 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:09:36,183 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9129, LAS: 0.8471, UEM: 0.5121, LEM: 0.2814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.5037, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5505, loss: 1.0156, batch_reg_loss: 0.0795, reg_loss: 0.0795 ||:   3%|2         | 3/111 [00:02<01:16,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9213, LAS: 0.8539, UEM: 0.5395, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6728, partial_loss/deprel_loss: 0.8153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8665, loss: 0.9328, batch_reg_loss: 0.0796, reg_loss: 0.0796 ||:   6%|6         | 7/111 [00:04<01:10,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8601, UAS: 0.9119, LAS: 0.8434, UEM: 0.4963, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5714, partial_loss/deprel_loss: 0.8098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8418, loss: 1.0238, batch_reg_loss: 0.0797, reg_loss: 0.0796 ||:   9%|9         | 10/111 [00:06<01:08,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9158, LAS: 0.8482, UEM: 0.4947, LEM: 0.2493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4600, partial_loss/deprel_loss: 0.6518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6932, loss: 0.9811, batch_reg_loss: 0.0798, reg_loss: 0.0796 ||:  13%|#2        | 14/111 [00:09<01:06,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9126, LAS: 0.8430, UEM: 0.4992, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1905, partial_loss/deprel_loss: 0.5070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 1.0350, batch_reg_loss: 0.0799, reg_loss: 0.0797 ||:  16%|#6        | 18/111 [00:11<01:01,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9172, LAS: 0.8487, UEM: 0.5242, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3962, partial_loss/deprel_loss: 0.5998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.9883, batch_reg_loss: 0.0799, reg_loss: 0.0797 ||:  19%|#8        | 21/111 [00:14<01:01,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9172, LAS: 0.8486, UEM: 0.5373, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4394, partial_loss/deprel_loss: 0.6408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6805, loss: 0.9807, batch_reg_loss: 0.0800, reg_loss: 0.0797 ||:  22%|##1       | 24/111 [00:16<01:03,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8847, UAS: 0.9188, LAS: 0.8518, UEM: 0.5242, LEM: 0.2712, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5723, partial_loss/deprel_loss: 0.6435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7094, loss: 0.9584, batch_reg_loss: 0.0801, reg_loss: 0.0798 ||:  25%|##5       | 28/111 [00:19<00:58,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9203, LAS: 0.8540, UEM: 0.5249, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.4650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5017, loss: 0.9409, batch_reg_loss: 0.0802, reg_loss: 0.0798 ||:  29%|##8       | 32/111 [00:21<00:54,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8028, UAS: 0.9190, LAS: 0.8522, UEM: 0.5190, LEM: 0.2695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3828, partial_loss/deprel_loss: 1.3768, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4582, loss: 0.9604, batch_reg_loss: 0.0802, reg_loss: 0.0799 ||:  32%|###1      | 35/111 [00:23<00:52,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7389, UAS: 0.9176, LAS: 0.8506, UEM: 0.5181, LEM: 0.2656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2919, partial_loss/deprel_loss: 1.6833, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8853, loss: 0.9725, batch_reg_loss: 0.0803, reg_loss: 0.0799 ||:  34%|###4      | 38/111 [00:26<00:52,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9187, LAS: 0.8517, UEM: 0.5193, LEM: 0.2625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3254, partial_loss/deprel_loss: 0.5673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5993, loss: 0.9599, batch_reg_loss: 0.0804, reg_loss: 0.0799 ||:  37%|###6      | 41/111 [00:28<00:50,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8510, UAS: 0.9194, LAS: 0.8522, UEM: 0.5159, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7491, partial_loss/deprel_loss: 0.8486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9091, loss: 0.9546, batch_reg_loss: 0.0804, reg_loss: 0.0800 ||:  40%|###9      | 44/111 [00:30<00:47,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9198, LAS: 0.8526, UEM: 0.5182, LEM: 0.2558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4518, partial_loss/deprel_loss: 0.7032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7334, loss: 0.9497, batch_reg_loss: 0.0805, reg_loss: 0.0800 ||:  42%|####2     | 47/111 [00:32<00:45,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9207, LAS: 0.8539, UEM: 0.5335, LEM: 0.2761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1517, partial_loss/deprel_loss: 0.3182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3655, loss: 0.9379, batch_reg_loss: 0.0805, reg_loss: 0.0800 ||:  45%|####5     | 50/111 [00:34<00:43,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8364, UAS: 0.9215, LAS: 0.8548, UEM: 0.5430, LEM: 0.2846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9017, partial_loss/deprel_loss: 1.0522, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1027, loss: 0.9278, batch_reg_loss: 0.0806, reg_loss: 0.0801 ||:  48%|####7     | 53/111 [00:37<00:42,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9200, LAS: 0.8530, UEM: 0.5317, LEM: 0.2759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6586, partial_loss/deprel_loss: 0.8304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8768, loss: 0.9473, batch_reg_loss: 0.0807, reg_loss: 0.0801 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9206, LAS: 0.8537, UEM: 0.5313, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3370, partial_loss/deprel_loss: 0.5406, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5806, loss: 0.9414, batch_reg_loss: 0.0807, reg_loss: 0.0801 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8269, UAS: 0.9210, LAS: 0.8541, UEM: 0.5338, LEM: 0.2764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9455, partial_loss/deprel_loss: 1.0358, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0985, loss: 0.9351, batch_reg_loss: 0.0808, reg_loss: 0.0802 ||:  57%|#####6    | 63/111 [00:43<00:34,  1.40it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7807, UAS: 0.9184, LAS: 0.8511, UEM: 0.5201, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6969, partial_loss/deprel_loss: 1.4591, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5876, loss: 0.9608, batch_reg_loss: 0.0809, reg_loss: 0.0802 ||:  60%|######    | 67/111 [00:46<00:30,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7824, UAS: 0.9154, LAS: 0.8479, UEM: 0.5090, LEM: 0.2617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7713, partial_loss/deprel_loss: 1.3922, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5490, loss: 0.9869, batch_reg_loss: 0.0810, reg_loss: 0.0802 ||:  64%|######3   | 71/111 [00:49<00:27,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9155, LAS: 0.8480, UEM: 0.5164, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1790, partial_loss/deprel_loss: 0.4022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4386, loss: 0.9870, batch_reg_loss: 0.0811, reg_loss: 0.0803 ||:  68%|######7   | 75/111 [00:51<00:24,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9141, LAS: 0.8463, UEM: 0.5077, LEM: 0.2615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6719, partial_loss/deprel_loss: 0.8466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8928, loss: 1.0058, batch_reg_loss: 0.0812, reg_loss: 0.0803 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7749, UAS: 0.9124, LAS: 0.8444, UEM: 0.4999, LEM: 0.2572, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7582, partial_loss/deprel_loss: 1.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5744, loss: 1.0213, batch_reg_loss: 0.0812, reg_loss: 0.0804 ||:  74%|#######3  | 82/111 [00:56<00:19,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9121, LAS: 0.8439, UEM: 0.4934, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5849, partial_loss/deprel_loss: 0.7789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8214, loss: 1.0266, batch_reg_loss: 0.0813, reg_loss: 0.0804 ||:  77%|#######6  | 85/111 [00:58<00:17,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9122, LAS: 0.8440, UEM: 0.4887, LEM: 0.2487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7833, partial_loss/deprel_loss: 1.0462, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0750, loss: 1.0278, batch_reg_loss: 0.0814, reg_loss: 0.0804 ||:  80%|########  | 89/111 [01:01<00:14,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9112, LAS: 0.8429, UEM: 0.4808, LEM: 0.2430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5965, partial_loss/deprel_loss: 0.7940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8360, loss: 1.0355, batch_reg_loss: 0.0815, reg_loss: 0.0805 ||:  84%|########3 | 93/111 [01:03<00:11,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7975, UAS: 0.9112, LAS: 0.8426, UEM: 0.4752, LEM: 0.2377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3786, partial_loss/deprel_loss: 1.3451, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4334, loss: 1.0376, batch_reg_loss: 0.0816, reg_loss: 0.0805 ||:  87%|########7 | 97/111 [01:05<00:08,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9109, LAS: 0.8420, UEM: 0.4715, LEM: 0.2341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6782, partial_loss/deprel_loss: 0.8343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8848, loss: 1.0429, batch_reg_loss: 0.0817, reg_loss: 0.0806 ||:  91%|######### | 101/111 [01:08<00:06,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7601, UAS: 0.9114, LAS: 0.8427, UEM: 0.4907, LEM: 0.2558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8753, partial_loss/deprel_loss: 1.6942, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8122, loss: 1.0390, batch_reg_loss: 0.0818, reg_loss: 0.0806 ||:  95%|#########4| 105/111 [01:11<00:04,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8028, UAS: 0.9112, LAS: 0.8426, UEM: 0.4832, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3786, partial_loss/deprel_loss: 1.2117, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3270, loss: 1.0401, batch_reg_loss: 0.0819, reg_loss: 0.0807 ||:  98%|#########8| 109/111 [01:14<00:01,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8393, UAS: 0.9112, LAS: 0.8424, UEM: 0.4790, LEM: 0.2474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8623, partial_loss/deprel_loss: 1.0124, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0643, loss: 1.0407, batch_reg_loss: 0.0819, reg_loss: 0.0807 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-06 23:10:51,901 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9633, LAS: 0.9155, UEM: 0.8426, LEM: 0.6012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2034, partial_loss/deprel_loss: 20.0996, partial_loss/cycle_loss: 0.0000, batch_loss: 16.1204, loss: 18.3759, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.05s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8487, UAS: 0.9482, LAS: 0.8943, UEM: 0.7481, LEM: 0.4864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1447, partial_loss/deprel_loss: 48.1773, partial_loss/cycle_loss: 0.0000, batch_loss: 38.7708, loss: 23.6897, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  31%|###       | 4/13 [00:04<00:09,  1.04s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8831, UAS: 0.9460, LAS: 0.8896, UEM: 0.6815, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5206, partial_loss/deprel_loss: 23.6872, partial_loss/cycle_loss: 0.0000, batch_loss: 19.0539, loss: 21.7025, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:06<00:05,  1.01it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8469, UAS: 0.9392, LAS: 0.8802, UEM: 0.6161, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0001, partial_loss/deprel_loss: 36.3661, partial_loss/cycle_loss: 0.0000, batch_loss: 29.2929, loss: 24.2677, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:09<00:02,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8713, UAS: 0.9333, LAS: 0.8731, UEM: 0.5785, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7952, partial_loss/deprel_loss: 29.1962, partial_loss/cycle_loss: 0.0000, batch_loss: 23.5160, loss: 26.0322, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:01,  1.01s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9363, LAS: 0.8771, UEM: 0.6121, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2237, partial_loss/deprel_loss: 23.0313, partial_loss/cycle_loss: 0.0000, batch_loss: 18.4698, loss: 25.4504, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-06 23:11:04,511 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.012  |    23.031\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.862  |     0.224\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.081  |     0.000\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - UEM                      |     0.479  |     0.612\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - LAS                      |     0.842  |     0.877\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - loss                     |     1.041  |    25.450\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - LEM                      |     0.247  |     0.344\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - UAS                      |     0.911  |     0.936\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - EM                       |     0.839  |     0.925\n",
      "2023-04-06 23:11:04,512 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:11:04,513 - INFO - combo.training.trainer - Epoch duration: 0:01:28.335274\n",
      "2023-04-06 23:11:04,513 - INFO - combo.training.trainer - Estimated training time remaining: 8:30:52\n",
      "2023-04-06 23:11:04,513 - INFO - allennlp.training.trainer - Epoch 16/399\n",
      "2023-04-06 23:11:04,513 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:11:04,513 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:11:04,519 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7589, UAS: 0.9080, LAS: 0.8432, UEM: 0.5846, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2122, partial_loss/deprel_loss: 1.5676, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7785, loss: 1.0280, batch_reg_loss: 0.0820, reg_loss: 0.0820 ||:   3%|2         | 3/111 [00:02<01:22,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8663, UAS: 0.9242, LAS: 0.8615, UEM: 0.5455, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6915, partial_loss/deprel_loss: 0.7745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8400, loss: 0.8831, batch_reg_loss: 0.0821, reg_loss: 0.0820 ||:   6%|6         | 7/111 [00:04<01:14,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8331, UAS: 0.9154, LAS: 0.8499, UEM: 0.4670, LEM: 0.2081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9397, partial_loss/deprel_loss: 1.1732, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2086, loss: 1.0023, batch_reg_loss: 0.0822, reg_loss: 0.0821 ||:   9%|9         | 10/111 [00:06<01:12,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8657, UAS: 0.9175, LAS: 0.8510, UEM: 0.4862, LEM: 0.2185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5694, partial_loss/deprel_loss: 0.7629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8065, loss: 0.9746, batch_reg_loss: 0.0823, reg_loss: 0.0821 ||:  13%|#2        | 14/111 [00:09<01:05,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8733, UAS: 0.9107, LAS: 0.8442, UEM: 0.4501, LEM: 0.1969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7070, partial_loss/deprel_loss: 0.7876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8538, loss: 1.0366, batch_reg_loss: 0.0823, reg_loss: 0.0821 ||:  16%|#6        | 18/111 [00:11<01:01,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9177, LAS: 0.8516, UEM: 0.5343, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2673, partial_loss/deprel_loss: 0.4801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5199, loss: 0.9668, batch_reg_loss: 0.0824, reg_loss: 0.0822 ||:  20%|#9        | 22/111 [00:14<00:58,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9192, LAS: 0.8529, UEM: 0.5322, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3409, partial_loss/deprel_loss: 0.5948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6265, loss: 0.9500, batch_reg_loss: 0.0825, reg_loss: 0.0822 ||:  23%|##2       | 25/111 [00:16<01:00,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8353, UAS: 0.9144, LAS: 0.8473, UEM: 0.5001, LEM: 0.2444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9402, partial_loss/deprel_loss: 1.0992, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1499, loss: 1.0039, batch_reg_loss: 0.0826, reg_loss: 0.0823 ||:  26%|##6       | 29/111 [00:19<00:54,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8619, UAS: 0.9124, LAS: 0.8448, UEM: 0.4943, LEM: 0.2411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6395, partial_loss/deprel_loss: 0.8357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8791, loss: 1.0205, batch_reg_loss: 0.0826, reg_loss: 0.0823 ||:  30%|##9       | 33/111 [00:21<00:50,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8202, UAS: 0.9116, LAS: 0.8445, UEM: 0.4757, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1420, partial_loss/deprel_loss: 1.1341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2184, loss: 1.0229, batch_reg_loss: 0.0827, reg_loss: 0.0823 ||:  32%|###2      | 36/111 [00:23<00:49,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9109, LAS: 0.8433, UEM: 0.4713, LEM: 0.2254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4303, partial_loss/deprel_loss: 0.6151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6610, loss: 1.0294, batch_reg_loss: 0.0828, reg_loss: 0.0824 ||:  36%|###6      | 40/111 [00:26<00:47,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8473, UAS: 0.9110, LAS: 0.8432, UEM: 0.4799, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7995, partial_loss/deprel_loss: 0.8820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9484, loss: 1.0291, batch_reg_loss: 0.0829, reg_loss: 0.0824 ||:  39%|###8      | 43/111 [00:28<00:47,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7958, UAS: 0.9110, LAS: 0.8432, UEM: 0.4756, LEM: 0.2299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3631, partial_loss/deprel_loss: 1.3073, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4014, loss: 1.0309, batch_reg_loss: 0.0829, reg_loss: 0.0825 ||:  41%|####1     | 46/111 [00:30<00:45,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8617, UAS: 0.9128, LAS: 0.8450, UEM: 0.4773, LEM: 0.2268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7004, partial_loss/deprel_loss: 0.9011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9440, loss: 1.0167, batch_reg_loss: 0.0830, reg_loss: 0.0825 ||:  44%|####4     | 49/111 [00:33<00:44,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8606, UAS: 0.9116, LAS: 0.8436, UEM: 0.4651, LEM: 0.2188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6289, partial_loss/deprel_loss: 0.8555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8933, loss: 1.0315, batch_reg_loss: 0.0831, reg_loss: 0.0825 ||:  48%|####7     | 53/111 [00:35<00:39,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8008, UAS: 0.9112, LAS: 0.8430, UEM: 0.4520, LEM: 0.2096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1899, partial_loss/deprel_loss: 1.2488, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3202, loss: 1.0350, batch_reg_loss: 0.0832, reg_loss: 0.0826 ||:  51%|#####1    | 57/111 [00:38<00:35,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9118, LAS: 0.8436, UEM: 0.4508, LEM: 0.2074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4705, partial_loss/deprel_loss: 0.6971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7350, loss: 1.0315, batch_reg_loss: 0.0833, reg_loss: 0.0826 ||:  55%|#####4    | 61/111 [00:40<00:34,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8310, UAS: 0.9122, LAS: 0.8440, UEM: 0.4514, LEM: 0.2077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0268, partial_loss/deprel_loss: 1.1379, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1990, loss: 1.0293, batch_reg_loss: 0.0833, reg_loss: 0.0826 ||:  58%|#####7    | 64/111 [00:43<00:32,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8854, UAS: 0.9126, LAS: 0.8445, UEM: 0.4557, LEM: 0.2132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3577, partial_loss/deprel_loss: 0.5272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5768, loss: 1.0256, batch_reg_loss: 0.0834, reg_loss: 0.0827 ||:  61%|######1   | 68/111 [00:45<00:29,  1.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9138, LAS: 0.8459, UEM: 0.4563, LEM: 0.2122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6427, partial_loss/deprel_loss: 0.9296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9557, loss: 1.0155, batch_reg_loss: 0.0835, reg_loss: 0.0827 ||:  65%|######4   | 72/111 [00:48<00:26,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9128, LAS: 0.8448, UEM: 0.4481, LEM: 0.2077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9213, partial_loss/deprel_loss: 0.9996, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0676, loss: 1.0238, batch_reg_loss: 0.0836, reg_loss: 0.0828 ||:  68%|######8   | 76/111 [00:50<00:23,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9138, LAS: 0.8463, UEM: 0.4699, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.3164, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3683, loss: 1.0118, batch_reg_loss: 0.0837, reg_loss: 0.0828 ||:  72%|#######2  | 80/111 [00:53<00:20,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7485, UAS: 0.9127, LAS: 0.8450, UEM: 0.4712, LEM: 0.2295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4496, partial_loss/deprel_loss: 1.8294, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0372, loss: 1.0233, batch_reg_loss: 0.0838, reg_loss: 0.0829 ||:  76%|#######5  | 84/111 [00:56<00:17,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9140, LAS: 0.8467, UEM: 0.4935, LEM: 0.2568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0828, partial_loss/deprel_loss: 0.2183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2751, loss: 1.0081, batch_reg_loss: 0.0839, reg_loss: 0.0829 ||:  79%|#######9  | 88/111 [00:59<00:15,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9135, LAS: 0.8460, UEM: 0.4869, LEM: 0.2512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4877, partial_loss/deprel_loss: 0.7291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7648, loss: 1.0140, batch_reg_loss: 0.0840, reg_loss: 0.0830 ||:  83%|########2 | 92/111 [01:01<00:12,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9137, LAS: 0.8462, UEM: 0.4900, LEM: 0.2533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0775, partial_loss/deprel_loss: 1.0943, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1750, loss: 1.0106, batch_reg_loss: 0.0841, reg_loss: 0.0830 ||:  86%|########6 | 96/111 [01:04<00:10,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9119, LAS: 0.8443, UEM: 0.4847, LEM: 0.2501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0740, partial_loss/deprel_loss: 1.0761, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1598, loss: 1.0296, batch_reg_loss: 0.0841, reg_loss: 0.0830 ||:  89%|########9 | 99/111 [01:07<00:08,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8246, UAS: 0.9125, LAS: 0.8451, UEM: 0.4915, LEM: 0.2556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0728, partial_loss/deprel_loss: 1.0576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1448, loss: 1.0224, batch_reg_loss: 0.0842, reg_loss: 0.0831 ||:  92%|#########1| 102/111 [01:09<00:06,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8747, UAS: 0.9125, LAS: 0.8449, UEM: 0.4885, LEM: 0.2531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4391, partial_loss/deprel_loss: 0.6192, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6675, loss: 1.0221, batch_reg_loss: 0.0843, reg_loss: 0.0831 ||:  95%|#########4| 105/111 [01:11<00:04,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8539, UAS: 0.9127, LAS: 0.8451, UEM: 0.4833, LEM: 0.2480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6720, partial_loss/deprel_loss: 0.8026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8609, loss: 1.0200, batch_reg_loss: 0.0844, reg_loss: 0.0831 ||:  98%|#########8| 109/111 [01:13<00:01,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8645, UAS: 0.9127, LAS: 0.8451, UEM: 0.4802, LEM: 0.2455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5954, partial_loss/deprel_loss: 0.8870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9131, loss: 1.0210, batch_reg_loss: 0.0844, reg_loss: 0.0832 ||: 100%|##########| 111/111 [01:14<00:00,  1.48it/s]\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.887  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.595  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.083  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - UEM                      |     0.480  |       N/A\n",
      "2023-04-06 23:12:19,452 - INFO - combo.training.tensorboard_writer - LAS                      |     0.845  |       N/A\n",
      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - loss                     |     1.021  |       N/A\n",
      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - LEM                      |     0.246  |       N/A\n",
      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - UAS                      |     0.913  |       N/A\n",
      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - EM                       |     0.864  |       N/A\n",
      "2023-04-06 23:12:19,453 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:12:19,454 - INFO - combo.training.trainer - Epoch duration: 0:01:14.940605\n",
      "2023-04-06 23:12:19,454 - INFO - combo.training.trainer - Estimated training time remaining: 8:27:43\n",
      "2023-04-06 23:12:19,454 - INFO - allennlp.training.trainer - Epoch 17/399\n",
      "2023-04-06 23:12:19,454 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:12:19,454 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:12:19,461 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.9216, LAS: 0.8554, UEM: 0.3382, LEM: 0.1011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5816, partial_loss/deprel_loss: 0.8625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8908, loss: 0.9648, batch_reg_loss: 0.0845, reg_loss: 0.0845 ||:   4%|3         | 4/111 [00:02<01:04,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8527, UAS: 0.9265, LAS: 0.8618, UEM: 0.3934, LEM: 0.1398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6621, partial_loss/deprel_loss: 0.8200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8730, loss: 0.8968, batch_reg_loss: 0.0846, reg_loss: 0.0845 ||:   6%|6         | 7/111 [00:04<01:08,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9162, LAS: 0.8500, UEM: 0.3532, LEM: 0.1257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0305, partial_loss/deprel_loss: 0.9789, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0739, loss: 0.9920, batch_reg_loss: 0.0846, reg_loss: 0.0845 ||:   9%|9         | 10/111 [00:06<01:06,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8026, UAS: 0.9184, LAS: 0.8528, UEM: 0.4350, LEM: 0.1899, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3660, partial_loss/deprel_loss: 1.2370, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3475, loss: 0.9582, batch_reg_loss: 0.0847, reg_loss: 0.0846 ||:  12%|#1        | 13/111 [00:08<01:05,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8967, UAS: 0.9205, LAS: 0.8554, UEM: 0.4904, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4147, partial_loss/deprel_loss: 0.5218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5851, loss: 0.9331, batch_reg_loss: 0.0848, reg_loss: 0.0846 ||:  15%|#5        | 17/111 [00:11<01:02,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9219, LAS: 0.8575, UEM: 0.5308, LEM: 0.2704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1652, partial_loss/deprel_loss: 0.4622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4877, loss: 0.9235, batch_reg_loss: 0.0849, reg_loss: 0.0846 ||:  18%|#8        | 20/111 [00:13<01:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8204, UAS: 0.9207, LAS: 0.8556, UEM: 0.5155, LEM: 0.2657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1489, partial_loss/deprel_loss: 1.1239, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2139, loss: 0.9339, batch_reg_loss: 0.0850, reg_loss: 0.0847 ||:  22%|##1       | 24/111 [00:16<00:57,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8496, UAS: 0.9208, LAS: 0.8555, UEM: 0.4917, LEM: 0.2469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7885, partial_loss/deprel_loss: 0.9084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9694, loss: 0.9335, batch_reg_loss: 0.0850, reg_loss: 0.0847 ||:  25%|##5       | 28/111 [00:18<00:52,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9203, LAS: 0.8549, UEM: 0.4892, LEM: 0.2457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2998, partial_loss/deprel_loss: 0.5312, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5701, loss: 0.9418, batch_reg_loss: 0.0851, reg_loss: 0.0848 ||:  28%|##7       | 31/111 [00:20<00:53,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8699, UAS: 0.9203, LAS: 0.8548, UEM: 0.4730, LEM: 0.2298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5786, partial_loss/deprel_loss: 0.7671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8146, loss: 0.9400, batch_reg_loss: 0.0852, reg_loss: 0.0848 ||:  32%|###1      | 35/111 [00:23<00:50,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9223, LAS: 0.8573, UEM: 0.4940, LEM: 0.2481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5172, partial_loss/deprel_loss: 0.6889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7398, loss: 0.9204, batch_reg_loss: 0.0853, reg_loss: 0.0849 ||:  34%|###4      | 38/111 [00:25<00:50,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8749, UAS: 0.9217, LAS: 0.8563, UEM: 0.4839, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5008, partial_loss/deprel_loss: 0.7724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8034, loss: 0.9291, batch_reg_loss: 0.0854, reg_loss: 0.0849 ||:  38%|###7      | 42/111 [00:27<00:45,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9206, LAS: 0.8548, UEM: 0.4822, LEM: 0.2346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3619, partial_loss/deprel_loss: 0.5743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6173, loss: 0.9410, batch_reg_loss: 0.0854, reg_loss: 0.0849 ||:  41%|####      | 45/111 [00:30<00:46,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9174, LAS: 0.8517, UEM: 0.4643, LEM: 0.2239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9001, partial_loss/deprel_loss: 0.9548, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0294, loss: 0.9654, batch_reg_loss: 0.0855, reg_loss: 0.0850 ||:  44%|####4     | 49/111 [00:32<00:42,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9165, LAS: 0.8508, UEM: 0.4653, LEM: 0.2219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8402, partial_loss/deprel_loss: 0.8455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9301, loss: 0.9775, batch_reg_loss: 0.0856, reg_loss: 0.0850 ||:  48%|####7     | 53/111 [00:35<00:38,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8495, UAS: 0.9179, LAS: 0.8524, UEM: 0.4743, LEM: 0.2237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8424, partial_loss/deprel_loss: 0.9273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9960, loss: 0.9632, batch_reg_loss: 0.0857, reg_loss: 0.0851 ||:  51%|#####1    | 57/111 [00:37<00:35,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9181, LAS: 0.8528, UEM: 0.4839, LEM: 0.2345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3615, partial_loss/deprel_loss: 0.5027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.9589, batch_reg_loss: 0.0858, reg_loss: 0.0851 ||:  55%|#####4    | 61/111 [00:40<00:33,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9201, LAS: 0.8551, UEM: 0.5090, LEM: 0.2596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4550, partial_loss/deprel_loss: 0.6768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7183, loss: 0.9397, batch_reg_loss: 0.0859, reg_loss: 0.0852 ||:  59%|#####8    | 65/111 [00:43<00:30,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9196, LAS: 0.8545, UEM: 0.5017, LEM: 0.2534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6634, partial_loss/deprel_loss: 0.7655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8311, loss: 0.9431, batch_reg_loss: 0.0860, reg_loss: 0.0852 ||:  62%|######2   | 69/111 [00:46<00:28,  1.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9189, LAS: 0.8537, UEM: 0.4995, LEM: 0.2534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4002, partial_loss/deprel_loss: 0.5723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6239, loss: 0.9510, batch_reg_loss: 0.0860, reg_loss: 0.0852 ||:  65%|######4   | 72/111 [00:48<00:26,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9195, LAS: 0.8542, UEM: 0.5001, LEM: 0.2517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4251, partial_loss/deprel_loss: 0.7046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7348, loss: 0.9440, batch_reg_loss: 0.0861, reg_loss: 0.0853 ||:  68%|######8   | 76/111 [00:50<00:23,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9161, LAS: 0.8505, UEM: 0.4923, LEM: 0.2467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5704, partial_loss/deprel_loss: 0.8707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8969, loss: 0.9753, batch_reg_loss: 0.0862, reg_loss: 0.0853 ||:  72%|#######2  | 80/111 [00:53<00:20,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8143, UAS: 0.9160, LAS: 0.8504, UEM: 0.4899, LEM: 0.2445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3190, partial_loss/deprel_loss: 1.2196, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3258, loss: 0.9778, batch_reg_loss: 0.0863, reg_loss: 0.0854 ||:  76%|#######5  | 84/111 [00:55<00:17,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7646, UAS: 0.9146, LAS: 0.8487, UEM: 0.4840, LEM: 0.2404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9803, partial_loss/deprel_loss: 1.4948, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6783, loss: 0.9919, batch_reg_loss: 0.0864, reg_loss: 0.0854 ||:  79%|#######9  | 88/111 [00:57<00:14,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9360, UAS: 0.9150, LAS: 0.8493, UEM: 0.5098, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0973, partial_loss/deprel_loss: 0.2371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2956, loss: 0.9903, batch_reg_loss: 0.0865, reg_loss: 0.0855 ||:  83%|########2 | 92/111 [01:01<00:12,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.9145, LAS: 0.8486, UEM: 0.5008, LEM: 0.2669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1653, partial_loss/deprel_loss: 1.1575, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2456, loss: 0.9977, batch_reg_loss: 0.0866, reg_loss: 0.0855 ||:  86%|########6 | 96/111 [01:05<00:11,  1.26it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8094, UAS: 0.9144, LAS: 0.8484, UEM: 0.4967, LEM: 0.2632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3131, partial_loss/deprel_loss: 1.1735, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2881, loss: 0.9981, batch_reg_loss: 0.0867, reg_loss: 0.0855 ||:  89%|########9 | 99/111 [01:07<00:09,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8428, UAS: 0.9144, LAS: 0.8483, UEM: 0.4979, LEM: 0.2638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8804, partial_loss/deprel_loss: 1.0840, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1300, loss: 0.9994, batch_reg_loss: 0.0867, reg_loss: 0.0856 ||:  92%|#########1| 102/111 [01:09<00:06,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9148, LAS: 0.8489, UEM: 0.4973, LEM: 0.2625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4124, partial_loss/deprel_loss: 0.5711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6262, loss: 0.9941, batch_reg_loss: 0.0868, reg_loss: 0.0856 ||:  95%|#########4| 105/111 [01:12<00:04,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9151, LAS: 0.8490, UEM: 0.4923, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7387, partial_loss/deprel_loss: 0.8004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8749, loss: 0.9937, batch_reg_loss: 0.0869, reg_loss: 0.0857 ||:  98%|#########8| 109/111 [01:14<00:01,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8040, UAS: 0.9140, LAS: 0.8479, UEM: 0.4885, LEM: 0.2549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3149, partial_loss/deprel_loss: 1.1623, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2798, loss: 1.0035, batch_reg_loss: 0.0869, reg_loss: 0.0857 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-06 23:13:34,894 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.162  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.315  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.086  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - UEM                      |     0.489  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - LAS                      |     0.848  |       N/A\n",
      "2023-04-06 23:13:34,895 - INFO - combo.training.tensorboard_writer - loss                     |     1.004  |       N/A\n",
      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - LEM                      |     0.255  |       N/A\n",
      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - UAS                      |     0.914  |       N/A\n",
      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - EM                       |     0.804  |       N/A\n",
      "2023-04-06 23:13:34,896 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:13:34,897 - INFO - combo.training.trainer - Epoch duration: 0:01:15.442752\n",
      "2023-04-06 23:13:34,897 - INFO - combo.training.trainer - Estimated training time remaining: 8:24:56\n",
      "2023-04-06 23:13:34,897 - INFO - allennlp.training.trainer - Epoch 18/399\n",
      "2023-04-06 23:13:34,897 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:13:34,897 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:13:34,904 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8228, UAS: 0.9169, LAS: 0.8505, UEM: 0.3212, LEM: 0.0933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0915, partial_loss/deprel_loss: 1.1094, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1928, loss: 0.9545, batch_reg_loss: 0.0870, reg_loss: 0.0870 ||:   3%|2         | 3/111 [00:02<01:20,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9276, LAS: 0.8623, UEM: 0.5231, LEM: 0.2611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3255, partial_loss/deprel_loss: 0.5087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5591, loss: 0.8390, batch_reg_loss: 0.0871, reg_loss: 0.0870 ||:   5%|5         | 6/111 [00:04<01:20,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9346, LAS: 0.8740, UEM: 0.6711, LEM: 0.4448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1051, partial_loss/deprel_loss: 0.2196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2839, loss: 0.7732, batch_reg_loss: 0.0872, reg_loss: 0.0871 ||:   9%|9         | 10/111 [00:07<01:17,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8591, UAS: 0.9301, LAS: 0.8680, UEM: 0.6054, LEM: 0.3828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6862, partial_loss/deprel_loss: 0.8887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9355, loss: 0.8377, batch_reg_loss: 0.0873, reg_loss: 0.0871 ||:  13%|#2        | 14/111 [00:10<01:09,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9300, LAS: 0.8676, UEM: 0.5688, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5562, partial_loss/deprel_loss: 0.6804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7430, loss: 0.8469, batch_reg_loss: 0.0874, reg_loss: 0.0872 ||:  16%|#6        | 18/111 [00:12<01:04,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9308, LAS: 0.8677, UEM: 0.5772, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1748, partial_loss/deprel_loss: 0.4864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5115, loss: 0.8475, batch_reg_loss: 0.0874, reg_loss: 0.0872 ||:  20%|#9        | 22/111 [00:15<01:00,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9230, LAS: 0.8594, UEM: 0.5669, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3768, partial_loss/deprel_loss: 0.5494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6024, loss: 0.9163, batch_reg_loss: 0.0875, reg_loss: 0.0872 ||:  23%|##2       | 25/111 [00:17<01:01,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8352, UAS: 0.9221, LAS: 0.8583, UEM: 0.5419, LEM: 0.3100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9141, partial_loss/deprel_loss: 1.1264, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1715, loss: 0.9262, batch_reg_loss: 0.0876, reg_loss: 0.0873 ||:  25%|##5       | 28/111 [00:19<00:57,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9203, LAS: 0.8562, UEM: 0.5457, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3203, partial_loss/deprel_loss: 0.5512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.9386, batch_reg_loss: 0.0876, reg_loss: 0.0873 ||:  28%|##7       | 31/111 [00:21<00:55,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8389, UAS: 0.9183, LAS: 0.8538, UEM: 0.5326, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9560, partial_loss/deprel_loss: 0.9772, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0607, loss: 0.9626, batch_reg_loss: 0.0877, reg_loss: 0.0874 ||:  32%|###1      | 35/111 [00:24<00:51,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9185, LAS: 0.8543, UEM: 0.5263, LEM: 0.2879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3537, partial_loss/deprel_loss: 0.5632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6091, loss: 0.9598, batch_reg_loss: 0.0878, reg_loss: 0.0874 ||:  35%|###5      | 39/111 [00:27<00:49,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9138, LAS: 0.8490, UEM: 0.5170, LEM: 0.2822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4010, partial_loss/deprel_loss: 0.5286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5910, loss: 1.0039, batch_reg_loss: 0.0879, reg_loss: 0.0874 ||:  39%|###8      | 43/111 [00:29<00:47,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9152, LAS: 0.8507, UEM: 0.5210, LEM: 0.2825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4241, partial_loss/deprel_loss: 0.6749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 0.9916, batch_reg_loss: 0.0880, reg_loss: 0.0875 ||:  41%|####1     | 46/111 [00:32<00:45,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8042, UAS: 0.9142, LAS: 0.8494, UEM: 0.5098, LEM: 0.2753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3450, partial_loss/deprel_loss: 1.1223, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2549, loss: 0.9971, batch_reg_loss: 0.0881, reg_loss: 0.0875 ||:  44%|####4     | 49/111 [00:34<00:44,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9148, LAS: 0.8502, UEM: 0.5006, LEM: 0.2659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4315, partial_loss/deprel_loss: 0.6747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7142, loss: 0.9906, batch_reg_loss: 0.0882, reg_loss: 0.0876 ||:  48%|####7     | 53/111 [00:36<00:40,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9139, LAS: 0.8492, UEM: 0.4906, LEM: 0.2577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5756, partial_loss/deprel_loss: 0.7295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7870, loss: 0.9980, batch_reg_loss: 0.0883, reg_loss: 0.0876 ||:  51%|#####1    | 57/111 [00:39<00:35,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7875, UAS: 0.9122, LAS: 0.8470, UEM: 0.4822, LEM: 0.2516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5783, partial_loss/deprel_loss: 1.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5525, loss: 1.0136, batch_reg_loss: 0.0884, reg_loss: 0.0877 ||:  55%|#####4    | 61/111 [00:41<00:33,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9123, LAS: 0.8474, UEM: 0.4979, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2670, partial_loss/deprel_loss: 0.4382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4924, loss: 1.0101, batch_reg_loss: 0.0884, reg_loss: 0.0877 ||:  59%|#####8    | 65/111 [00:44<00:31,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8053, UAS: 0.9124, LAS: 0.8475, UEM: 0.4922, LEM: 0.2636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3323, partial_loss/deprel_loss: 1.3069, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4005, loss: 1.0098, batch_reg_loss: 0.0885, reg_loss: 0.0877 ||:  61%|######1   | 68/111 [00:46<00:29,  1.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9130, LAS: 0.8481, UEM: 0.4973, LEM: 0.2674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1742, partial_loss/deprel_loss: 1.2064, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2885, loss: 1.0040, batch_reg_loss: 0.0886, reg_loss: 0.0878 ||:  64%|######3   | 71/111 [00:48<00:27,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9135, LAS: 0.8489, UEM: 0.5123, LEM: 0.2847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1399, partial_loss/deprel_loss: 0.3012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3576, loss: 0.9980, batch_reg_loss: 0.0887, reg_loss: 0.0878 ||:  68%|######7   | 75/111 [00:51<00:24,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8536, UAS: 0.9134, LAS: 0.8486, UEM: 0.5078, LEM: 0.2796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7427, partial_loss/deprel_loss: 0.9010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9581, loss: 1.0009, batch_reg_loss: 0.0887, reg_loss: 0.0879 ||:  70%|#######   | 78/111 [00:53<00:23,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7803, UAS: 0.9131, LAS: 0.8483, UEM: 0.5069, LEM: 0.2774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8427, partial_loss/deprel_loss: 1.5858, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7260, loss: 1.0046, batch_reg_loss: 0.0888, reg_loss: 0.0879 ||:  73%|#######2  | 81/111 [00:56<00:21,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8095, UAS: 0.9134, LAS: 0.8483, UEM: 0.5000, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2830, partial_loss/deprel_loss: 1.1385, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2563, loss: 1.0034, batch_reg_loss: 0.0889, reg_loss: 0.0879 ||:  77%|#######6  | 85/111 [00:58<00:17,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8533, UAS: 0.9131, LAS: 0.8480, UEM: 0.4932, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8080, partial_loss/deprel_loss: 0.8970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9682, loss: 1.0072, batch_reg_loss: 0.0890, reg_loss: 0.0880 ||:  80%|########  | 89/111 [01:00<00:14,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9132, LAS: 0.8480, UEM: 0.4909, LEM: 0.2622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3357, partial_loss/deprel_loss: 0.5487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5952, loss: 1.0083, batch_reg_loss: 0.0891, reg_loss: 0.0880 ||:  84%|########3 | 93/111 [01:03<00:11,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9140, LAS: 0.8488, UEM: 0.4943, LEM: 0.2648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4893, partial_loss/deprel_loss: 0.7979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8254, loss: 1.0029, batch_reg_loss: 0.0892, reg_loss: 0.0881 ||:  87%|########7 | 97/111 [01:06<00:09,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8230, UAS: 0.9135, LAS: 0.8483, UEM: 0.4857, LEM: 0.2584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1926, partial_loss/deprel_loss: 1.1354, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2361, loss: 1.0052, batch_reg_loss: 0.0893, reg_loss: 0.0881 ||:  91%|######### | 101/111 [01:08<00:06,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8649, UAS: 0.9144, LAS: 0.8493, UEM: 0.4890, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6948, partial_loss/deprel_loss: 0.8095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8759, loss: 0.9975, batch_reg_loss: 0.0893, reg_loss: 0.0882 ||:  94%|#########3| 104/111 [01:11<00:04,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8489, UAS: 0.9143, LAS: 0.8492, UEM: 0.4848, LEM: 0.2548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9411, partial_loss/deprel_loss: 0.8917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9910, loss: 0.9983, batch_reg_loss: 0.0894, reg_loss: 0.0882 ||:  96%|#########6| 107/111 [01:13<00:02,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9151, LAS: 0.8501, UEM: 0.4914, LEM: 0.2580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3863, partial_loss/deprel_loss: 0.6280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6691, loss: 0.9898, batch_reg_loss: 0.0895, reg_loss: 0.0882 ||:  99%|#########9| 110/111 [01:15<00:00,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9153, LAS: 0.8503, UEM: 0.4906, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5699, partial_loss/deprel_loss: 0.8068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8490, loss: 0.9886, batch_reg_loss: 0.0895, reg_loss: 0.0882 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
      "2023-04-06 23:14:50,914 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:14:50,914 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.807  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.570  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.088  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - UEM                      |     0.491  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - LAS                      |     0.850  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - loss                     |     0.989  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:14:50,915 - INFO - combo.training.tensorboard_writer - LEM                      |     0.257  |       N/A\n",
      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - UAS                      |     0.915  |       N/A\n",
      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - EM                       |     0.870  |       N/A\n",
      "2023-04-06 23:14:50,916 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:14:50,916 - INFO - combo.training.trainer - Epoch duration: 0:01:16.019608\n",
      "2023-04-06 23:14:50,917 - INFO - combo.training.trainer - Estimated training time remaining: 8:22:31\n",
      "2023-04-06 23:14:50,917 - INFO - allennlp.training.trainer - Epoch 19/399\n",
      "2023-04-06 23:14:50,917 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:14:50,917 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-06 23:14:50,923 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9280, LAS: 0.8663, UEM: 0.4818, LEM: 0.2052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3412, partial_loss/deprel_loss: 0.5427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5920, loss: 0.8326, batch_reg_loss: 0.0896, reg_loss: 0.0896 ||:   4%|3         | 4/111 [00:02<01:06,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8347, UAS: 0.9147, LAS: 0.8502, UEM: 0.3867, LEM: 0.1510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0561, partial_loss/deprel_loss: 1.0243, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1203, loss: 0.9958, batch_reg_loss: 0.0897, reg_loss: 0.0896 ||:   6%|6         | 7/111 [00:04<01:07,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7890, UAS: 0.9112, LAS: 0.8450, UEM: 0.3595, LEM: 0.1344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5057, partial_loss/deprel_loss: 1.4440, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5460, loss: 1.0469, batch_reg_loss: 0.0897, reg_loss: 0.0896 ||:   9%|9         | 10/111 [00:06<01:06,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9132, LAS: 0.8471, UEM: 0.3635, LEM: 0.1282, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8014, partial_loss/deprel_loss: 0.8880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9604, loss: 1.0209, batch_reg_loss: 0.0898, reg_loss: 0.0897 ||:  12%|#1        | 13/111 [00:08<01:05,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8711, UAS: 0.9142, LAS: 0.8481, UEM: 0.3500, LEM: 0.1202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5703, partial_loss/deprel_loss: 0.7201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7801, loss: 1.0151, batch_reg_loss: 0.0899, reg_loss: 0.0897 ||:  15%|#5        | 17/111 [00:11<01:02,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8080, UAS: 0.9147, LAS: 0.8485, UEM: 0.3594, LEM: 0.1297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3113, partial_loss/deprel_loss: 1.1270, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2538, loss: 1.0083, batch_reg_loss: 0.0899, reg_loss: 0.0897 ||:  18%|#8        | 20/111 [00:13<01:01,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8353, UAS: 0.9089, LAS: 0.8422, UEM: 0.3288, LEM: 0.1173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0613, partial_loss/deprel_loss: 0.9594, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0698, loss: 1.0639, batch_reg_loss: 0.0900, reg_loss: 0.0898 ||:  22%|##1       | 24/111 [00:16<00:57,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8194, UAS: 0.9075, LAS: 0.8401, UEM: 0.3043, LEM: 0.1081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1332, partial_loss/deprel_loss: 1.1339, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2239, loss: 1.0805, batch_reg_loss: 0.0901, reg_loss: 0.0898 ||:  25%|##5       | 28/111 [00:18<00:54,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9118, LAS: 0.8454, UEM: 0.3797, LEM: 0.1651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2529, partial_loss/deprel_loss: 0.4029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4631, loss: 1.0336, batch_reg_loss: 0.0902, reg_loss: 0.0899 ||:  28%|##7       | 31/111 [00:20<00:53,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9146, LAS: 0.8488, UEM: 0.4005, LEM: 0.1766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2672, partial_loss/deprel_loss: 0.4931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5382, loss: 1.0074, batch_reg_loss: 0.0903, reg_loss: 0.0899 ||:  32%|###1      | 35/111 [00:23<00:51,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9167, LAS: 0.8515, UEM: 0.4096, LEM: 0.1790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5449, partial_loss/deprel_loss: 0.7061, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7642, loss: 0.9820, batch_reg_loss: 0.0904, reg_loss: 0.0899 ||:  35%|###5      | 39/111 [00:25<00:47,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9189, LAS: 0.8544, UEM: 0.4478, LEM: 0.2113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2027, partial_loss/deprel_loss: 0.4174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4649, loss: 0.9584, batch_reg_loss: 0.0905, reg_loss: 0.0900 ||:  38%|###7      | 42/111 [00:28<00:47,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8055, UAS: 0.9189, LAS: 0.8545, UEM: 0.4558, LEM: 0.2175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4937, partial_loss/deprel_loss: 1.2253, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3695, loss: 0.9560, batch_reg_loss: 0.0905, reg_loss: 0.0900 ||:  41%|####      | 45/111 [00:30<00:46,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7630, UAS: 0.9134, LAS: 0.8488, UEM: 0.4408, LEM: 0.2103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9478, partial_loss/deprel_loss: 1.5173, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6940, loss: 1.0013, batch_reg_loss: 0.0906, reg_loss: 0.0901 ||:  44%|####4     | 49/111 [00:33<00:42,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9136, LAS: 0.8490, UEM: 0.4447, LEM: 0.2155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3234, partial_loss/deprel_loss: 0.4641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5266, loss: 1.0002, batch_reg_loss: 0.0907, reg_loss: 0.0901 ||:  47%|####6     | 52/111 [00:35<00:42,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8632, UAS: 0.9148, LAS: 0.8508, UEM: 0.4497, LEM: 0.2170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8531, partial_loss/deprel_loss: 0.7755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8818, loss: 0.9856, batch_reg_loss: 0.0907, reg_loss: 0.0901 ||:  50%|####9     | 55/111 [00:37<00:39,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8783, UAS: 0.9144, LAS: 0.8503, UEM: 0.4407, LEM: 0.2094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4102, partial_loss/deprel_loss: 0.7027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7350, loss: 0.9948, batch_reg_loss: 0.0908, reg_loss: 0.0902 ||:  53%|#####3    | 59/111 [00:40<00:35,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9144, LAS: 0.8500, UEM: 0.4305, LEM: 0.2013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7175, partial_loss/deprel_loss: 0.8354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9027, loss: 0.9954, batch_reg_loss: 0.0909, reg_loss: 0.0902 ||:  57%|#####6    | 63/111 [00:42<00:32,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9160, LAS: 0.8519, UEM: 0.4603, LEM: 0.2304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1260, partial_loss/deprel_loss: 0.2969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3537, loss: 0.9770, batch_reg_loss: 0.0910, reg_loss: 0.0903 ||:  59%|#####9    | 66/111 [00:44<00:31,  1.41it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9146, LAS: 0.8503, UEM: 0.4620, LEM: 0.2308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3607, partial_loss/deprel_loss: 0.5944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6387, loss: 0.9922, batch_reg_loss: 0.0911, reg_loss: 0.0903 ||:  62%|######2   | 69/111 [00:47<00:29,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9152, LAS: 0.8511, UEM: 0.4865, LEM: 0.2638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0865, partial_loss/deprel_loss: 0.2023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2703, loss: 0.9884, batch_reg_loss: 0.0911, reg_loss: 0.0903 ||:  65%|######4   | 72/111 [00:49<00:29,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7450, UAS: 0.9129, LAS: 0.8483, UEM: 0.4786, LEM: 0.2592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4474, partial_loss/deprel_loss: 1.6060, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8655, loss: 1.0093, batch_reg_loss: 0.0912, reg_loss: 0.0904 ||:  68%|######7   | 75/111 [00:51<00:26,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9145, LAS: 0.8501, UEM: 0.4913, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3422, partial_loss/deprel_loss: 0.5563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6047, loss: 0.9942, batch_reg_loss: 0.0913, reg_loss: 0.0904 ||:  70%|#######   | 78/111 [00:53<00:23,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8686, UAS: 0.9147, LAS: 0.8503, UEM: 0.4911, LEM: 0.2628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6024, partial_loss/deprel_loss: 0.8119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8614, loss: 0.9942, batch_reg_loss: 0.0914, reg_loss: 0.0904 ||:  74%|#######3  | 82/111 [00:56<00:19,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8070, UAS: 0.9148, LAS: 0.8505, UEM: 0.4921, LEM: 0.2639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3560, partial_loss/deprel_loss: 1.2549, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3665, loss: 0.9919, batch_reg_loss: 0.0914, reg_loss: 0.0905 ||:  77%|#######6  | 85/111 [00:58<00:18,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8503, UAS: 0.9139, LAS: 0.8493, UEM: 0.4854, LEM: 0.2583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7237, partial_loss/deprel_loss: 0.8698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9321, loss: 1.0020, batch_reg_loss: 0.0915, reg_loss: 0.0905 ||:  80%|########  | 89/111 [01:01<00:15,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7970, UAS: 0.9132, LAS: 0.8486, UEM: 0.4798, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6280, partial_loss/deprel_loss: 1.2208, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3938, loss: 1.0073, batch_reg_loss: 0.0916, reg_loss: 0.0905 ||:  83%|########2 | 92/111 [01:03<00:13,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9145, LAS: 0.8499, UEM: 0.4895, LEM: 0.2595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1750, partial_loss/deprel_loss: 0.4655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4991, loss: 0.9969, batch_reg_loss: 0.0917, reg_loss: 0.0906 ||:  86%|########5 | 95/111 [01:05<00:11,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8012, UAS: 0.9144, LAS: 0.8497, UEM: 0.4877, LEM: 0.2581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4152, partial_loss/deprel_loss: 1.2303, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3590, loss: 0.9990, batch_reg_loss: 0.0917, reg_loss: 0.0906 ||:  88%|########8 | 98/111 [01:07<00:09,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8507, UAS: 0.9146, LAS: 0.8498, UEM: 0.4837, LEM: 0.2542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7947, partial_loss/deprel_loss: 0.9044, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9742, loss: 0.9972, batch_reg_loss: 0.0918, reg_loss: 0.0907 ||:  91%|######### | 101/111 [01:09<00:07,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9154, LAS: 0.8507, UEM: 0.4849, LEM: 0.2528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4251, partial_loss/deprel_loss: 0.5496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6166, loss: 0.9904, batch_reg_loss: 0.0919, reg_loss: 0.0907 ||:  95%|#########4| 105/111 [01:12<00:04,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9157, LAS: 0.8511, UEM: 0.4917, LEM: 0.2596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4593, partial_loss/deprel_loss: 0.6486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7027, loss: 0.9860, batch_reg_loss: 0.0919, reg_loss: 0.0907 ||:  97%|#########7| 108/111 [01:15<00:02,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8103, UAS: 0.9161, LAS: 0.8514, UEM: 0.4941, LEM: 0.2598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3019, partial_loss/deprel_loss: 1.1335, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2592, loss: 0.9835, batch_reg_loss: 0.0920, reg_loss: 0.0908 ||: 100%|##########| 111/111 [01:17<00:00,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8103, UAS: 0.9161, LAS: 0.8514, UEM: 0.4941, LEM: 0.2598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3019, partial_loss/deprel_loss: 1.1335, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2592, loss: 0.9835, batch_reg_loss: 0.0920, reg_loss: 0.0908 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
      "2023-04-06 23:16:08,307 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.134  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.302  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.091  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - UEM                      |     0.494  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - LAS                      |     0.851  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - loss                     |     0.984  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:16:08,308 - INFO - combo.training.tensorboard_writer - LEM                      |     0.260  |       N/A\n",
      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - UAS                      |     0.916  |       N/A\n",
      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - EM                       |     0.810  |       N/A\n",
      "2023-04-06 23:16:08,309 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:16:08,309 - INFO - combo.training.trainer - Epoch duration: 0:01:17.392753\n",
      "2023-04-06 23:16:08,310 - INFO - combo.training.trainer - Estimated training time remaining: 8:20:39\n",
      "2023-04-06 23:16:08,310 - INFO - allennlp.training.trainer - Epoch 20/399\n",
      "2023-04-06 23:16:08,310 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:16:08,310 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-06 23:16:08,316 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9521, LAS: 0.8974, UEM: 0.7753, LEM: 0.6200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3512, partial_loss/deprel_loss: 0.6386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6732, loss: 0.6190, batch_reg_loss: 0.0921, reg_loss: 0.0920 ||:   3%|2         | 3/111 [00:02<01:31,  1.17it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7149, UAS: 0.9217, LAS: 0.8639, UEM: 0.7221, LEM: 0.5348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0170, partial_loss/deprel_loss: 1.8682, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1901, loss: 0.8866, batch_reg_loss: 0.0921, reg_loss: 0.0921 ||:   6%|6         | 7/111 [00:04<01:20,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9203, LAS: 0.8612, UEM: 0.6885, LEM: 0.4941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2541, partial_loss/deprel_loss: 0.4469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5005, loss: 0.9092, batch_reg_loss: 0.0922, reg_loss: 0.0921 ||:   9%|9         | 10/111 [00:07<01:16,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8377, UAS: 0.9200, LAS: 0.8602, UEM: 0.6465, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9482, partial_loss/deprel_loss: 1.0288, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.9218, batch_reg_loss: 0.0923, reg_loss: 0.0921 ||:  12%|#1        | 13/111 [00:09<01:13,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9260, LAS: 0.8667, UEM: 0.6404, LEM: 0.4198, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3305, partial_loss/deprel_loss: 0.5257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5790, loss: 0.8611, batch_reg_loss: 0.0923, reg_loss: 0.0922 ||:  15%|#5        | 17/111 [00:11<01:06,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8555, UAS: 0.9266, LAS: 0.8650, UEM: 0.6031, LEM: 0.3783, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6330, partial_loss/deprel_loss: 0.8089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8662, loss: 0.8658, batch_reg_loss: 0.0924, reg_loss: 0.0922 ||:  19%|#8        | 21/111 [00:14<01:01,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9235, LAS: 0.8615, UEM: 0.5818, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5684, partial_loss/deprel_loss: 0.7775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8282, loss: 0.8950, batch_reg_loss: 0.0925, reg_loss: 0.0923 ||:  22%|##1       | 24/111 [00:16<00:59,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9259, LAS: 0.8641, UEM: 0.5802, LEM: 0.3457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4870, partial_loss/deprel_loss: 0.6752, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7301, loss: 0.8726, batch_reg_loss: 0.0926, reg_loss: 0.0923 ||:  24%|##4       | 27/111 [00:18<00:58,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9255, LAS: 0.8640, UEM: 0.5700, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3910, partial_loss/deprel_loss: 0.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5549, loss: 0.8753, batch_reg_loss: 0.0926, reg_loss: 0.0923 ||:  27%|##7       | 30/111 [00:20<00:56,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8875, UAS: 0.9263, LAS: 0.8651, UEM: 0.5635, LEM: 0.3275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5597, partial_loss/deprel_loss: 0.6210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7014, loss: 0.8682, batch_reg_loss: 0.0927, reg_loss: 0.0923 ||:  30%|##9       | 33/111 [00:22<00:53,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9252, LAS: 0.8637, UEM: 0.5582, LEM: 0.3224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3287, partial_loss/deprel_loss: 0.5773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6203, loss: 0.8801, batch_reg_loss: 0.0927, reg_loss: 0.0924 ||:  32%|###2      | 36/111 [00:24<00:52,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.9254, LAS: 0.8637, UEM: 0.5541, LEM: 0.3170, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6296, partial_loss/deprel_loss: 0.7761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8396, loss: 0.8814, batch_reg_loss: 0.0928, reg_loss: 0.0924 ||:  35%|###5      | 39/111 [00:27<00:52,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9236, LAS: 0.8612, UEM: 0.5381, LEM: 0.3055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0152, partial_loss/deprel_loss: 0.9462, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0529, loss: 0.9042, batch_reg_loss: 0.0929, reg_loss: 0.0924 ||:  38%|###7      | 42/111 [00:29<00:50,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8396, UAS: 0.9249, LAS: 0.8627, UEM: 0.5504, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8873, partial_loss/deprel_loss: 1.0102, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0786, loss: 0.8923, batch_reg_loss: 0.0929, reg_loss: 0.0925 ||:  41%|####      | 45/111 [00:31<00:47,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8389, UAS: 0.9246, LAS: 0.8622, UEM: 0.5363, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8750, partial_loss/deprel_loss: 0.9418, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0214, loss: 0.8949, batch_reg_loss: 0.0930, reg_loss: 0.0925 ||:  44%|####4     | 49/111 [00:33<00:42,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9244, LAS: 0.8620, UEM: 0.5327, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7190, partial_loss/deprel_loss: 0.8342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9043, loss: 0.8976, batch_reg_loss: 0.0931, reg_loss: 0.0925 ||:  47%|####6     | 52/111 [00:35<00:40,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8847, UAS: 0.9237, LAS: 0.8612, UEM: 0.5251, LEM: 0.2915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 0.6874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7233, loss: 0.9062, batch_reg_loss: 0.0931, reg_loss: 0.0926 ||:  50%|####9     | 55/111 [00:37<00:38,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9240, LAS: 0.8615, UEM: 0.5296, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3117, partial_loss/deprel_loss: 0.4649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5275, loss: 0.9034, batch_reg_loss: 0.0932, reg_loss: 0.0926 ||:  52%|#####2    | 58/111 [00:40<00:37,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9247, LAS: 0.8623, UEM: 0.5344, LEM: 0.2969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3854, partial_loss/deprel_loss: 0.5744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6299, loss: 0.8967, batch_reg_loss: 0.0933, reg_loss: 0.0926 ||:  55%|#####4    | 61/111 [00:42<00:35,  1.39it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7501, UAS: 0.9220, LAS: 0.8592, UEM: 0.5220, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0578, partial_loss/deprel_loss: 1.6962, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8619, loss: 0.9225, batch_reg_loss: 0.0934, reg_loss: 0.0927 ||:  59%|#####8    | 65/111 [00:45<00:32,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8401, UAS: 0.9210, LAS: 0.8582, UEM: 0.5109, LEM: 0.2804, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8382, partial_loss/deprel_loss: 0.9579, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0274, loss: 0.9295, batch_reg_loss: 0.0934, reg_loss: 0.0927 ||:  62%|######2   | 69/111 [00:47<00:27,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8715, UAS: 0.9208, LAS: 0.8578, UEM: 0.5065, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5938, partial_loss/deprel_loss: 0.7648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8241, loss: 0.9320, batch_reg_loss: 0.0935, reg_loss: 0.0928 ||:  66%|######5   | 73/111 [00:50<00:25,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9205, LAS: 0.8575, UEM: 0.5089, LEM: 0.2756, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4596, partial_loss/deprel_loss: 0.7226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7637, loss: 0.9351, batch_reg_loss: 0.0936, reg_loss: 0.0928 ||:  69%|######9   | 77/111 [00:53<00:23,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8154, UAS: 0.9196, LAS: 0.8565, UEM: 0.5025, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3989, partial_loss/deprel_loss: 1.2230, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3519, loss: 0.9459, batch_reg_loss: 0.0937, reg_loss: 0.0929 ||:  73%|#######2  | 81/111 [00:55<00:19,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9202, LAS: 0.8571, UEM: 0.5031, LEM: 0.2700, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3432, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6244, loss: 0.9399, batch_reg_loss: 0.0938, reg_loss: 0.0929 ||:  77%|#######6  | 85/111 [00:57<00:16,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7840, UAS: 0.9193, LAS: 0.8562, UEM: 0.4962, LEM: 0.2652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9018, partial_loss/deprel_loss: 1.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6089, loss: 0.9479, batch_reg_loss: 0.0939, reg_loss: 0.0929 ||:  80%|########  | 89/111 [01:01<00:15,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7733, UAS: 0.9190, LAS: 0.8557, UEM: 0.4967, LEM: 0.2642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9213, partial_loss/deprel_loss: 1.5481, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7167, loss: 0.9522, batch_reg_loss: 0.0940, reg_loss: 0.0930 ||:  83%|########2 | 92/111 [01:03<00:13,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8547, UAS: 0.9182, LAS: 0.8549, UEM: 0.4904, LEM: 0.2589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5844, partial_loss/deprel_loss: 0.8200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8669, loss: 0.9578, batch_reg_loss: 0.0941, reg_loss: 0.0930 ||:  86%|########6 | 96/111 [01:05<00:10,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8160, UAS: 0.9179, LAS: 0.8545, UEM: 0.4835, LEM: 0.2533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3356, partial_loss/deprel_loss: 1.2480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3597, loss: 0.9618, batch_reg_loss: 0.0942, reg_loss: 0.0931 ||:  90%|######### | 100/111 [01:08<00:07,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8480, UAS: 0.9185, LAS: 0.8549, UEM: 0.4847, LEM: 0.2529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8264, partial_loss/deprel_loss: 0.9697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0353, loss: 0.9581, batch_reg_loss: 0.0942, reg_loss: 0.0931 ||:  93%|#########2| 103/111 [01:10<00:05,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9190, LAS: 0.8556, UEM: 0.5012, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1585, partial_loss/deprel_loss: 0.3249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3859, loss: 0.9525, batch_reg_loss: 0.0943, reg_loss: 0.0931 ||:  95%|#########5| 106/111 [01:12<00:03,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8343, UAS: 0.9174, LAS: 0.8537, UEM: 0.4963, LEM: 0.2666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9702, partial_loss/deprel_loss: 0.9739, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0675, loss: 0.9691, batch_reg_loss: 0.0944, reg_loss: 0.0932 ||:  98%|#########8| 109/111 [01:14<00:01,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8448, UAS: 0.9175, LAS: 0.8538, UEM: 0.4941, LEM: 0.2641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9358, partial_loss/deprel_loss: 0.9596, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0492, loss: 0.9684, batch_reg_loss: 0.0944, reg_loss: 0.0932 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
      "2023-04-06 23:17:24,438 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9379, LAS: 0.8819, UEM: 0.4929, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8324, partial_loss/deprel_loss: 30.4534, partial_loss/cycle_loss: 0.0000, batch_loss: 24.5292, loss: 22.6841, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.14it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9483, LAS: 0.8961, UEM: 0.7019, LEM: 0.4664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4225, partial_loss/deprel_loss: 25.9318, partial_loss/cycle_loss: 0.0000, batch_loss: 20.8300, loss: 21.0524, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:07,  1.09it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8710, UAS: 0.9460, LAS: 0.8899, UEM: 0.6444, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6182, partial_loss/deprel_loss: 33.9471, partial_loss/cycle_loss: 0.0000, batch_loss: 27.2813, loss: 21.9483, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.13it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9433, LAS: 0.8872, UEM: 0.6348, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1976, partial_loss/deprel_loss: 23.3129, partial_loss/cycle_loss: 0.0000, batch_loss: 18.6898, loss: 24.3207, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:09<00:01,  1.10it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9382, LAS: 0.8808, UEM: 0.6098, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5354, partial_loss/deprel_loss: 23.9953, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3033, loss: 25.6272, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00,  1.09it/s]\n",
      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:17:36,368 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.960  |    23.995\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.936  |     0.535\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.093  |     0.000\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - UEM                      |     0.494  |     0.610\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - LAS                      |     0.854  |     0.881\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - loss                     |     0.968  |    25.627\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - LEM                      |     0.264  |     0.350\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - UAS                      |     0.918  |     0.938\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - EM                       |     0.845  |     0.885\n",
      "2023-04-06 23:17:36,369 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:17:36,370 - INFO - combo.training.trainer - Epoch duration: 0:01:28.060274\n",
      "2023-04-06 23:17:36,370 - INFO - combo.training.trainer - Estimated training time remaining: 8:22:02\n",
      "2023-04-06 23:17:36,370 - INFO - allennlp.training.trainer - Epoch 21/399\n",
      "2023-04-06 23:17:36,370 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:17:36,371 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:17:36,376 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8363, UAS: 0.9258, LAS: 0.8623, UEM: 0.3812, LEM: 0.1341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0052, partial_loss/deprel_loss: 0.9565, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0607, loss: 0.9069, batch_reg_loss: 0.0945, reg_loss: 0.0944 ||:   3%|2         | 3/111 [00:02<01:17,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9203, LAS: 0.8558, UEM: 0.3611, LEM: 0.1313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3760, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6596, loss: 0.9642, batch_reg_loss: 0.0946, reg_loss: 0.0945 ||:   6%|6         | 7/111 [00:04<01:13,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8580, UAS: 0.9250, LAS: 0.8613, UEM: 0.3832, LEM: 0.1313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8690, partial_loss/deprel_loss: 0.9013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9895, loss: 0.9139, batch_reg_loss: 0.0947, reg_loss: 0.0945 ||:  10%|9         | 11/111 [00:07<01:07,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8533, UAS: 0.9155, LAS: 0.8505, UEM: 0.3310, LEM: 0.1096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7844, partial_loss/deprel_loss: 0.8858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9602, loss: 0.9989, batch_reg_loss: 0.0947, reg_loss: 0.0946 ||:  14%|#3        | 15/111 [00:09<01:03,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8521, UAS: 0.9187, LAS: 0.8536, UEM: 0.3559, LEM: 0.1284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7069, partial_loss/deprel_loss: 0.9114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9654, loss: 0.9738, batch_reg_loss: 0.0948, reg_loss: 0.0946 ||:  17%|#7        | 19/111 [00:12<01:00,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8454, UAS: 0.9194, LAS: 0.8549, UEM: 0.3802, LEM: 0.1447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9340, partial_loss/deprel_loss: 0.8900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9937, loss: 0.9615, batch_reg_loss: 0.0949, reg_loss: 0.0947 ||:  21%|##        | 23/111 [00:14<00:56,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9213, LAS: 0.8573, UEM: 0.4043, LEM: 0.1632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3409, partial_loss/deprel_loss: 0.5584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6099, loss: 0.9402, batch_reg_loss: 0.0950, reg_loss: 0.0947 ||:  24%|##4       | 27/111 [00:17<00:52,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9229, LAS: 0.8593, UEM: 0.4209, LEM: 0.1772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3523, partial_loss/deprel_loss: 0.5628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6158, loss: 0.9247, batch_reg_loss: 0.0951, reg_loss: 0.0948 ||:  28%|##7       | 31/111 [00:19<00:51,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8642, UAS: 0.9226, LAS: 0.8594, UEM: 0.4405, LEM: 0.1987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7041, partial_loss/deprel_loss: 0.8753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9363, loss: 0.9259, batch_reg_loss: 0.0952, reg_loss: 0.0948 ||:  32%|###1      | 35/111 [00:22<00:48,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9234, LAS: 0.8603, UEM: 0.4429, LEM: 0.2005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9610, partial_loss/deprel_loss: 0.8971, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0052, loss: 0.9134, batch_reg_loss: 0.0953, reg_loss: 0.0949 ||:  35%|###5      | 39/111 [00:25<00:46,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7296, UAS: 0.9207, LAS: 0.8576, UEM: 0.4694, LEM: 0.2335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 3.0297, partial_loss/deprel_loss: 1.8059, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1460, loss: 0.9392, batch_reg_loss: 0.0953, reg_loss: 0.0949 ||:  38%|###7      | 42/111 [00:27<00:46,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9230, LAS: 0.8604, UEM: 0.4986, LEM: 0.2542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4283, partial_loss/deprel_loss: 0.6117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6704, loss: 0.9153, batch_reg_loss: 0.0954, reg_loss: 0.0949 ||:  41%|####      | 45/111 [00:29<00:45,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8595, UAS: 0.9227, LAS: 0.8601, UEM: 0.4996, LEM: 0.2565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7368, partial_loss/deprel_loss: 0.8730, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9412, loss: 0.9158, batch_reg_loss: 0.0954, reg_loss: 0.0950 ||:  43%|####3     | 48/111 [00:31<00:45,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8347, UAS: 0.9213, LAS: 0.8584, UEM: 0.4874, LEM: 0.2479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9492, partial_loss/deprel_loss: 1.1123, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1752, loss: 0.9301, batch_reg_loss: 0.0955, reg_loss: 0.0950 ||:  46%|####5     | 51/111 [00:34<00:43,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9193, LAS: 0.8562, UEM: 0.4801, LEM: 0.2417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5844, partial_loss/deprel_loss: 0.7754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8328, loss: 0.9488, batch_reg_loss: 0.0956, reg_loss: 0.0950 ||:  49%|####8     | 54/111 [00:36<00:41,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9175, LAS: 0.8539, UEM: 0.4693, LEM: 0.2347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2272, partial_loss/deprel_loss: 1.2433, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3357, loss: 0.9674, batch_reg_loss: 0.0957, reg_loss: 0.0951 ||:  52%|#####2    | 58/111 [00:38<00:37,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9193, LAS: 0.8564, UEM: 0.5091, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1029, partial_loss/deprel_loss: 0.2265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2975, loss: 0.9466, batch_reg_loss: 0.0957, reg_loss: 0.0951 ||:  55%|#####4    | 61/111 [00:41<00:39,  1.26it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.9187, LAS: 0.8552, UEM: 0.4985, LEM: 0.2708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6729, partial_loss/deprel_loss: 0.7973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8682, loss: 0.9533, batch_reg_loss: 0.0958, reg_loss: 0.0951 ||:  59%|#####8    | 65/111 [00:44<00:33,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8202, UAS: 0.9188, LAS: 0.8557, UEM: 0.4976, LEM: 0.2690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3849, partial_loss/deprel_loss: 1.1817, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3182, loss: 0.9503, batch_reg_loss: 0.0959, reg_loss: 0.0952 ||:  61%|######1   | 68/111 [00:46<00:30,  1.39it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9184, LAS: 0.8552, UEM: 0.4954, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2846, partial_loss/deprel_loss: 0.4353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5012, loss: 0.9528, batch_reg_loss: 0.0960, reg_loss: 0.0952 ||:  65%|######4   | 72/111 [00:48<00:27,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9177, LAS: 0.8545, UEM: 0.4896, LEM: 0.2640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8338, partial_loss/deprel_loss: 0.8384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9335, loss: 0.9619, batch_reg_loss: 0.0961, reg_loss: 0.0953 ||:  68%|######8   | 76/111 [00:51<00:23,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8785, UAS: 0.9189, LAS: 0.8556, UEM: 0.4982, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3850, partial_loss/deprel_loss: 0.6036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6560, loss: 0.9503, batch_reg_loss: 0.0961, reg_loss: 0.0953 ||:  71%|#######1  | 79/111 [00:54<00:23,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7855, UAS: 0.9170, LAS: 0.8532, UEM: 0.4909, LEM: 0.2626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7202, partial_loss/deprel_loss: 1.4704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6166, loss: 0.9708, batch_reg_loss: 0.0962, reg_loss: 0.0953 ||:  74%|#######3  | 82/111 [00:56<00:20,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8386, UAS: 0.9167, LAS: 0.8527, UEM: 0.4814, LEM: 0.2560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9546, partial_loss/deprel_loss: 1.0401, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1193, loss: 0.9757, batch_reg_loss: 0.0963, reg_loss: 0.0954 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8799, UAS: 0.9178, LAS: 0.8541, UEM: 0.4946, LEM: 0.2651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4311, partial_loss/deprel_loss: 0.6831, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7291, loss: 0.9636, batch_reg_loss: 0.0964, reg_loss: 0.0954 ||:  80%|########  | 89/111 [01:00<00:15,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8296, UAS: 0.9177, LAS: 0.8538, UEM: 0.4900, LEM: 0.2610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2122, partial_loss/deprel_loss: 1.0230, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1573, loss: 0.9669, batch_reg_loss: 0.0965, reg_loss: 0.0954 ||:  83%|########2 | 92/111 [01:02<00:13,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9174, LAS: 0.8535, UEM: 0.4914, LEM: 0.2603, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3006, partial_loss/deprel_loss: 0.5337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5836, loss: 0.9690, batch_reg_loss: 0.0965, reg_loss: 0.0955 ||:  86%|########5 | 95/111 [01:04<00:11,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9168, LAS: 0.8528, UEM: 0.4893, LEM: 0.2586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4066, partial_loss/deprel_loss: 0.6253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6781, loss: 0.9755, batch_reg_loss: 0.0966, reg_loss: 0.0955 ||:  88%|########8 | 98/111 [01:07<00:09,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8708, UAS: 0.9167, LAS: 0.8525, UEM: 0.4840, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6369, partial_loss/deprel_loss: 0.7295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8077, loss: 0.9770, batch_reg_loss: 0.0967, reg_loss: 0.0955 ||:  91%|######### | 101/111 [01:09<00:06,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8529, UAS: 0.9169, LAS: 0.8528, UEM: 0.4859, LEM: 0.2553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8818, partial_loss/deprel_loss: 0.8098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9210, loss: 0.9743, batch_reg_loss: 0.0968, reg_loss: 0.0956 ||:  95%|#########4| 105/111 [01:11<00:04,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8621, UAS: 0.9174, LAS: 0.8535, UEM: 0.4861, LEM: 0.2537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5777, partial_loss/deprel_loss: 0.8117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8617, loss: 0.9685, batch_reg_loss: 0.0968, reg_loss: 0.0956 ||:  97%|#########7| 108/111 [01:14<00:02,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8666, UAS: 0.9184, LAS: 0.8544, UEM: 0.4937, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6128, partial_loss/deprel_loss: 0.8212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8764, loss: 0.9610, batch_reg_loss: 0.0969, reg_loss: 0.0956 ||: 100%|##########| 111/111 [01:16<00:00,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8666, UAS: 0.9184, LAS: 0.8544, UEM: 0.4937, LEM: 0.2579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6128, partial_loss/deprel_loss: 0.8212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8764, loss: 0.9610, batch_reg_loss: 0.0969, reg_loss: 0.0956 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.821  |       N/A\n",
      "2023-04-06 23:18:53,121 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.613  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.096  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - UEM                      |     0.494  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - LAS                      |     0.854  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - loss                     |     0.961  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - LEM                      |     0.258  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - UAS                      |     0.918  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - EM                       |     0.867  |       N/A\n",
      "2023-04-06 23:18:53,122 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:18:53,123 - INFO - combo.training.trainer - Epoch duration: 0:01:16.752609\n",
      "2023-04-06 23:18:53,123 - INFO - combo.training.trainer - Estimated training time remaining: 8:19:56\n",
      "2023-04-06 23:18:53,123 - INFO - allennlp.training.trainer - Epoch 22/399\n",
      "2023-04-06 23:18:53,123 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:18:53,123 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:18:53,130 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8548, UAS: 0.9361, LAS: 0.8734, UEM: 0.4864, LEM: 0.2167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8275, partial_loss/deprel_loss: 0.8561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9474, loss: 0.8003, batch_reg_loss: 0.0970, reg_loss: 0.0970 ||:   4%|3         | 4/111 [00:02<00:57,  1.86it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8194, UAS: 0.9300, LAS: 0.8699, UEM: 0.5067, LEM: 0.2404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4623, partial_loss/deprel_loss: 1.1682, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3241, loss: 0.8539, batch_reg_loss: 0.0971, reg_loss: 0.0970 ||:   7%|7         | 8/111 [00:04<00:56,  1.81it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9287, LAS: 0.8690, UEM: 0.4604, LEM: 0.2002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7500, partial_loss/deprel_loss: 0.8352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9153, loss: 0.8580, batch_reg_loss: 0.0971, reg_loss: 0.0970 ||:  11%|#         | 12/111 [00:06<00:56,  1.77it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9332, LAS: 0.8739, UEM: 0.5000, LEM: 0.2279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2665, partial_loss/deprel_loss: 0.4745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5301, loss: 0.8228, batch_reg_loss: 0.0972, reg_loss: 0.0971 ||:  14%|#3        | 15/111 [00:08<00:58,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9380, LAS: 0.8796, UEM: 0.5910, LEM: 0.3243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4276, partial_loss/deprel_loss: 0.6461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6996, loss: 0.7743, batch_reg_loss: 0.0973, reg_loss: 0.0971 ||:  16%|#6        | 18/111 [00:11<01:00,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8666, UAS: 0.9388, LAS: 0.8795, UEM: 0.5882, LEM: 0.3117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5401, partial_loss/deprel_loss: 0.7525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8074, loss: 0.7672, batch_reg_loss: 0.0973, reg_loss: 0.0971 ||:  19%|#8        | 21/111 [00:13<00:59,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9394, LAS: 0.8805, UEM: 0.5959, LEM: 0.3183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8269, partial_loss/deprel_loss: 0.9416, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0160, loss: 0.7596, batch_reg_loss: 0.0974, reg_loss: 0.0971 ||:  22%|##1       | 24/111 [00:15<00:58,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8729, UAS: 0.9385, LAS: 0.8795, UEM: 0.5779, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6153, partial_loss/deprel_loss: 0.8072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8663, loss: 0.7663, batch_reg_loss: 0.0974, reg_loss: 0.0972 ||:  24%|##4       | 27/111 [00:17<00:57,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9341, LAS: 0.8746, UEM: 0.5516, LEM: 0.2868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8354, partial_loss/deprel_loss: 1.2851, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4926, loss: 0.8122, batch_reg_loss: 0.0975, reg_loss: 0.0972 ||:  28%|##7       | 31/111 [00:20<00:53,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8138, UAS: 0.9303, LAS: 0.8703, UEM: 0.5369, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3798, partial_loss/deprel_loss: 1.2360, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3623, loss: 0.8503, batch_reg_loss: 0.0976, reg_loss: 0.0972 ||:  32%|###1      | 35/111 [00:22<00:51,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9314, LAS: 0.8718, UEM: 0.5791, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.5500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6164, loss: 0.8361, batch_reg_loss: 0.0976, reg_loss: 0.0973 ||:  34%|###4      | 38/111 [00:25<00:55,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8747, UAS: 0.9312, LAS: 0.8709, UEM: 0.5703, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5884, partial_loss/deprel_loss: 0.7088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7824, loss: 0.8412, batch_reg_loss: 0.0977, reg_loss: 0.0973 ||:  37%|###6      | 41/111 [00:27<00:52,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9275, LAS: 0.8665, UEM: 0.5581, LEM: 0.3114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6344, partial_loss/deprel_loss: 0.7415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8178, loss: 0.8770, batch_reg_loss: 0.0977, reg_loss: 0.0973 ||:  40%|###9      | 44/111 [00:29<00:48,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9283, LAS: 0.8671, UEM: 0.5570, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4666, partial_loss/deprel_loss: 0.6955, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7476, loss: 0.8715, batch_reg_loss: 0.0978, reg_loss: 0.0974 ||:  43%|####3     | 48/111 [00:32<00:44,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9256, LAS: 0.8640, UEM: 0.5457, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4119, partial_loss/deprel_loss: 0.5915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6535, loss: 0.8893, batch_reg_loss: 0.0979, reg_loss: 0.0974 ||:  47%|####6     | 52/111 [00:35<00:40,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9268, LAS: 0.8653, UEM: 0.5666, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1844, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4296, loss: 0.8788, batch_reg_loss: 0.0980, reg_loss: 0.0974 ||:  50%|####9     | 55/111 [00:37<00:40,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9261, LAS: 0.8643, UEM: 0.5619, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3166, partial_loss/deprel_loss: 0.4570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5270, loss: 0.8857, batch_reg_loss: 0.0981, reg_loss: 0.0975 ||:  53%|#####3    | 59/111 [00:39<00:35,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7876, UAS: 0.9239, LAS: 0.8618, UEM: 0.5473, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7525, partial_loss/deprel_loss: 1.3168, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5021, loss: 0.9059, batch_reg_loss: 0.0982, reg_loss: 0.0975 ||:  57%|#####6    | 63/111 [00:42<00:32,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8164, UAS: 0.9234, LAS: 0.8610, UEM: 0.5373, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3867, partial_loss/deprel_loss: 1.1551, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2997, loss: 0.9142, batch_reg_loss: 0.0982, reg_loss: 0.0976 ||:  59%|#####9    | 66/111 [00:44<00:30,  1.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8013, UAS: 0.9236, LAS: 0.8612, UEM: 0.5420, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4252, partial_loss/deprel_loss: 1.3715, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4806, loss: 0.9127, batch_reg_loss: 0.0983, reg_loss: 0.0976 ||:  62%|######2   | 69/111 [00:47<00:30,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9236, LAS: 0.8613, UEM: 0.5379, LEM: 0.2975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5400, partial_loss/deprel_loss: 0.6561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7313, loss: 0.9139, batch_reg_loss: 0.0984, reg_loss: 0.0976 ||:  65%|######4   | 72/111 [00:49<00:28,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9226, LAS: 0.8598, UEM: 0.5300, LEM: 0.2902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5208, partial_loss/deprel_loss: 0.7197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7784, loss: 0.9243, batch_reg_loss: 0.0985, reg_loss: 0.0977 ||:  68%|######8   | 76/111 [00:51<00:24,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9214, LAS: 0.8586, UEM: 0.5237, LEM: 0.2858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7298, partial_loss/deprel_loss: 0.7075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8105, loss: 0.9339, batch_reg_loss: 0.0986, reg_loss: 0.0977 ||:  72%|#######2  | 80/111 [00:54<00:21,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9218, LAS: 0.8591, UEM: 0.5252, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5913, partial_loss/deprel_loss: 0.7371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8066, loss: 0.9308, batch_reg_loss: 0.0986, reg_loss: 0.0977 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9213, LAS: 0.8584, UEM: 0.5176, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4704, partial_loss/deprel_loss: 1.1766, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3341, loss: 0.9378, batch_reg_loss: 0.0987, reg_loss: 0.0978 ||:  78%|#######8  | 87/111 [00:59<00:16,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7587, UAS: 0.9197, LAS: 0.8566, UEM: 0.5081, LEM: 0.2734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3102, partial_loss/deprel_loss: 1.6186, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8557, loss: 0.9530, batch_reg_loss: 0.0988, reg_loss: 0.0978 ||:  82%|########1 | 91/111 [01:01<00:13,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8198, UAS: 0.9189, LAS: 0.8555, UEM: 0.4985, LEM: 0.2667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2651, partial_loss/deprel_loss: 1.0647, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2037, loss: 0.9623, batch_reg_loss: 0.0989, reg_loss: 0.0979 ||:  86%|########5 | 95/111 [01:04<00:10,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9190, LAS: 0.8555, UEM: 0.4983, LEM: 0.2662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5153, partial_loss/deprel_loss: 0.7901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8342, loss: 0.9627, batch_reg_loss: 0.0990, reg_loss: 0.0979 ||:  89%|########9 | 99/111 [01:06<00:07,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9191, LAS: 0.8558, UEM: 0.5012, LEM: 0.2698, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5980, partial_loss/deprel_loss: 0.7163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7918, loss: 0.9603, batch_reg_loss: 0.0991, reg_loss: 0.0980 ||:  93%|#########2| 103/111 [01:09<00:05,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9187, LAS: 0.8553, UEM: 0.5018, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8508, partial_loss/deprel_loss: 0.9035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9922, loss: 0.9639, batch_reg_loss: 0.0992, reg_loss: 0.0980 ||:  96%|#########6| 107/111 [01:11<00:02,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9197, LAS: 0.8564, UEM: 0.5037, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4395, partial_loss/deprel_loss: 0.6932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7417, loss: 0.9546, batch_reg_loss: 0.0993, reg_loss: 0.0981 ||: 100%|##########| 111/111 [01:14<00:00,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9197, LAS: 0.8564, UEM: 0.5037, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4395, partial_loss/deprel_loss: 0.6932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7417, loss: 0.9546, batch_reg_loss: 0.0993, reg_loss: 0.0981 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-06 23:20:07,331 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.693  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.439  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.098  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - UEM                      |     0.504  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - LAS                      |     0.856  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - loss                     |     0.955  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - LEM                      |     0.269  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - UAS                      |     0.920  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - EM                       |     0.880  |       N/A\n",
      "2023-04-06 23:20:07,332 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:20:07,333 - INFO - combo.training.trainer - Epoch duration: 0:01:14.210037\n",
      "2023-04-06 23:20:07,333 - INFO - combo.training.trainer - Estimated training time remaining: 8:17:12\n",
      "2023-04-06 23:20:07,333 - INFO - allennlp.training.trainer - Epoch 23/399\n",
      "2023-04-06 23:20:07,333 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:20:07,334 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:20:07,340 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.8949, LAS: 0.8287, UEM: 0.1098, LEM: 0.0122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1080, partial_loss/deprel_loss: 1.0936, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1958, loss: 1.2573, batch_reg_loss: 0.0994, reg_loss: 0.0993 ||:   3%|2         | 3/111 [00:02<01:12,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9162, LAS: 0.8520, UEM: 0.4313, LEM: 0.1854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9910, partial_loss/deprel_loss: 0.9522, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0594, loss: 1.0167, batch_reg_loss: 0.0994, reg_loss: 0.0994 ||:   5%|5         | 6/111 [00:04<01:12,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9208, LAS: 0.8586, UEM: 0.4514, LEM: 0.1973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4497, partial_loss/deprel_loss: 0.7025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7515, loss: 0.9521, batch_reg_loss: 0.0995, reg_loss: 0.0994 ||:   9%|9         | 10/111 [00:06<01:06,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9220, LAS: 0.8594, UEM: 0.4382, LEM: 0.1919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5719, partial_loss/deprel_loss: 0.6911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7669, loss: 0.9378, batch_reg_loss: 0.0996, reg_loss: 0.0994 ||:  12%|#1        | 13/111 [00:08<01:05,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8195, UAS: 0.9152, LAS: 0.8517, UEM: 0.4119, LEM: 0.1816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4563, partial_loss/deprel_loss: 1.1203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2872, loss: 1.0058, batch_reg_loss: 0.0997, reg_loss: 0.0995 ||:  15%|#5        | 17/111 [00:11<01:02,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9212, LAS: 0.8597, UEM: 0.5133, LEM: 0.2807, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4697, partial_loss/deprel_loss: 0.6013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6747, loss: 0.9357, batch_reg_loss: 0.0997, reg_loss: 0.0995 ||:  18%|#8        | 20/111 [00:13<01:05,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7982, UAS: 0.9195, LAS: 0.8577, UEM: 0.4810, LEM: 0.2547, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6368, partial_loss/deprel_loss: 1.2883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4579, loss: 0.9546, batch_reg_loss: 0.0998, reg_loss: 0.0996 ||:  22%|##1       | 24/111 [00:16<00:58,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9207, LAS: 0.8587, UEM: 0.4830, LEM: 0.2536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7993, partial_loss/deprel_loss: 0.8640, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9510, loss: 0.9487, batch_reg_loss: 0.0999, reg_loss: 0.0996 ||:  24%|##4       | 27/111 [00:18<00:57,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9174, LAS: 0.8551, UEM: 0.4849, LEM: 0.2546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2721, partial_loss/deprel_loss: 0.4954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5507, loss: 0.9817, batch_reg_loss: 0.1000, reg_loss: 0.0996 ||:  27%|##7       | 30/111 [00:20<00:56,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8186, UAS: 0.9170, LAS: 0.8551, UEM: 0.4742, LEM: 0.2476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2339, partial_loss/deprel_loss: 1.1452, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2630, loss: 0.9804, batch_reg_loss: 0.1000, reg_loss: 0.0997 ||:  30%|##9       | 33/111 [00:22<00:54,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9191, LAS: 0.8576, UEM: 0.5179, LEM: 0.2871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1584, partial_loss/deprel_loss: 0.3758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4324, loss: 0.9551, batch_reg_loss: 0.1001, reg_loss: 0.0997 ||:  32%|###2      | 36/111 [00:24<00:52,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9208, LAS: 0.8592, UEM: 0.5176, LEM: 0.2831, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3242, partial_loss/deprel_loss: 0.5435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5999, loss: 0.9375, batch_reg_loss: 0.1002, reg_loss: 0.0998 ||:  36%|###6      | 40/111 [00:27<00:49,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9215, LAS: 0.8597, UEM: 0.5178, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4017, partial_loss/deprel_loss: 0.5735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6394, loss: 0.9290, batch_reg_loss: 0.1003, reg_loss: 0.0998 ||:  39%|###8      | 43/111 [00:29<00:47,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9230, LAS: 0.8616, UEM: 0.5530, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0951, partial_loss/deprel_loss: 0.2286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3023, loss: 0.9164, batch_reg_loss: 0.1003, reg_loss: 0.0998 ||:  41%|####1     | 46/111 [00:31<00:48,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9233, LAS: 0.8621, UEM: 0.5553, LEM: 0.3236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4974, partial_loss/deprel_loss: 0.6754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7402, loss: 0.9117, batch_reg_loss: 0.1004, reg_loss: 0.0999 ||:  44%|####4     | 49/111 [00:34<00:45,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8017, UAS: 0.9220, LAS: 0.8608, UEM: 0.5543, LEM: 0.3267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5379, partial_loss/deprel_loss: 1.2708, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4247, loss: 0.9204, batch_reg_loss: 0.1005, reg_loss: 0.0999 ||:  48%|####7     | 53/111 [00:36<00:41,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9218, LAS: 0.8605, UEM: 0.5487, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3058, partial_loss/deprel_loss: 0.5159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5744, loss: 0.9219, batch_reg_loss: 0.1005, reg_loss: 0.0999 ||:  50%|#####     | 56/111 [00:38<00:39,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9142, UAS: 0.9226, LAS: 0.8614, UEM: 0.5549, LEM: 0.3237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1668, partial_loss/deprel_loss: 0.4572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4997, loss: 0.9170, batch_reg_loss: 0.1006, reg_loss: 0.1000 ||:  53%|#####3    | 59/111 [00:41<00:38,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9232, LAS: 0.8619, UEM: 0.5563, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5530, partial_loss/deprel_loss: 0.6772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7530, loss: 0.9111, batch_reg_loss: 0.1007, reg_loss: 0.1000 ||:  56%|#####5    | 62/111 [00:43<00:36,  1.34it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9238, LAS: 0.8623, UEM: 0.5494, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4779, partial_loss/deprel_loss: 0.8325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8623, loss: 0.9075, batch_reg_loss: 0.1008, reg_loss: 0.1000 ||:  59%|#####9    | 66/111 [00:46<00:32,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9234, LAS: 0.8620, UEM: 0.5454, LEM: 0.3091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9666, partial_loss/deprel_loss: 0.9580, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0606, loss: 0.9100, batch_reg_loss: 0.1008, reg_loss: 0.1001 ||:  62%|######2   | 69/111 [00:48<00:29,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9209, LAS: 0.8594, UEM: 0.5390, LEM: 0.3046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5884, partial_loss/deprel_loss: 0.8047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8623, loss: 0.9318, batch_reg_loss: 0.1009, reg_loss: 0.1001 ||:  65%|######4   | 72/111 [00:50<00:27,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.9218, LAS: 0.8603, UEM: 0.5415, LEM: 0.3048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6952, partial_loss/deprel_loss: 0.8219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8975, loss: 0.9227, batch_reg_loss: 0.1009, reg_loss: 0.1001 ||:  68%|######7   | 75/111 [00:52<00:26,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8815, UAS: 0.9209, LAS: 0.8591, UEM: 0.5355, LEM: 0.2978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5396, partial_loss/deprel_loss: 0.6414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7220, loss: 0.9309, batch_reg_loss: 0.1010, reg_loss: 0.1002 ||:  71%|#######1  | 79/111 [00:55<00:23,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9214, LAS: 0.8597, UEM: 0.5347, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3550, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6287, loss: 0.9262, batch_reg_loss: 0.1011, reg_loss: 0.1002 ||:  74%|#######3  | 82/111 [00:57<00:20,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9216, LAS: 0.8599, UEM: 0.5292, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1648, partial_loss/deprel_loss: 1.1497, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2539, loss: 0.9257, batch_reg_loss: 0.1012, reg_loss: 0.1003 ||:  77%|#######7  | 86/111 [00:59<00:16,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8274, UAS: 0.9212, LAS: 0.8595, UEM: 0.5286, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1797, partial_loss/deprel_loss: 1.0297, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1609, loss: 0.9283, batch_reg_loss: 0.1013, reg_loss: 0.1003 ||:  80%|########  | 89/111 [01:02<00:15,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9205, LAS: 0.8586, UEM: 0.5206, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8560, partial_loss/deprel_loss: 0.8923, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9864, loss: 0.9342, batch_reg_loss: 0.1013, reg_loss: 0.1003 ||:  83%|########2 | 92/111 [01:04<00:13,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8405, UAS: 0.9196, LAS: 0.8574, UEM: 0.5135, LEM: 0.2820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8253, partial_loss/deprel_loss: 0.8840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9737, loss: 0.9429, batch_reg_loss: 0.1014, reg_loss: 0.1004 ||:  86%|########5 | 95/111 [01:06<00:11,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8775, UAS: 0.9202, LAS: 0.8579, UEM: 0.5121, LEM: 0.2781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4252, partial_loss/deprel_loss: 0.6383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6971, loss: 0.9379, batch_reg_loss: 0.1015, reg_loss: 0.1004 ||:  88%|########8 | 98/111 [01:08<00:09,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9202, LAS: 0.8578, UEM: 0.5151, LEM: 0.2800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3950, partial_loss/deprel_loss: 0.6499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7004, loss: 0.9367, batch_reg_loss: 0.1015, reg_loss: 0.1004 ||:  91%|######### | 101/111 [01:10<00:07,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9204, LAS: 0.8580, UEM: 0.5113, LEM: 0.2761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5823, partial_loss/deprel_loss: 0.7403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8103, loss: 0.9358, batch_reg_loss: 0.1016, reg_loss: 0.1005 ||:  94%|#########3| 104/111 [01:13<00:05,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9201, LAS: 0.8575, UEM: 0.5075, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3702, partial_loss/deprel_loss: 1.1280, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2781, loss: 0.9388, batch_reg_loss: 0.1017, reg_loss: 0.1005 ||:  96%|#########6| 107/111 [01:15<00:02,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9199, LAS: 0.8573, UEM: 0.5026, LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.7012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7733, loss: 0.9416, batch_reg_loss: 0.1018, reg_loss: 0.1005 ||: 100%|##########| 111/111 [01:17<00:00,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9199, LAS: 0.8573, UEM: 0.5026, LEM: 0.2678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.7012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7733, loss: 0.9416, batch_reg_loss: 0.1018, reg_loss: 0.1005 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
      "2023-04-06 23:21:25,103 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:21:25,103 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:21:25,103 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.701  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.553  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.101  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - UEM                      |     0.503  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - LAS                      |     0.857  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - loss                     |     0.942  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - LEM                      |     0.268  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - UAS                      |     0.920  |       N/A\n",
      "2023-04-06 23:21:25,104 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:21:25,105 - INFO - combo.training.tensorboard_writer - EM                       |     0.879  |       N/A\n",
      "2023-04-06 23:21:25,105 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:21:25,105 - INFO - combo.training.trainer - Epoch duration: 0:01:17.771978\n",
      "2023-04-06 23:21:25,105 - INFO - combo.training.trainer - Estimated training time remaining: 8:15:32\n",
      "2023-04-06 23:21:25,105 - INFO - allennlp.training.trainer - Epoch 24/399\n",
      "2023-04-06 23:21:25,106 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:21:25,106 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:21:25,112 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9498, LAS: 0.8965, UEM: 0.6134, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4244, partial_loss/deprel_loss: 0.5337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6136, loss: 0.6403, batch_reg_loss: 0.1018, reg_loss: 0.1018 ||:   3%|2         | 3/111 [00:02<01:13,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7832, UAS: 0.9222, LAS: 0.8663, UEM: 0.5378, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0726, partial_loss/deprel_loss: 1.2622, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5262, loss: 0.8804, batch_reg_loss: 0.1019, reg_loss: 0.1018 ||:   5%|5         | 6/111 [00:04<01:12,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9254, LAS: 0.8696, UEM: 0.5613, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2665, partial_loss/deprel_loss: 0.4438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5103, loss: 0.8574, batch_reg_loss: 0.1020, reg_loss: 0.1019 ||:   8%|8         | 9/111 [00:06<01:13,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9290, LAS: 0.8697, UEM: 0.5375, LEM: 0.2582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5027, partial_loss/deprel_loss: 0.7213, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7796, loss: 0.8491, batch_reg_loss: 0.1021, reg_loss: 0.1019 ||:  12%|#1        | 13/111 [00:08<01:05,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8115, UAS: 0.9180, LAS: 0.8568, UEM: 0.4769, LEM: 0.2268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3171, partial_loss/deprel_loss: 1.1869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3151, loss: 0.9530, batch_reg_loss: 0.1021, reg_loss: 0.1020 ||:  15%|#5        | 17/111 [00:11<01:01,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9202, LAS: 0.8585, UEM: 0.4617, LEM: 0.2124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5182, partial_loss/deprel_loss: 0.6378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7161, loss: 0.9386, batch_reg_loss: 0.1022, reg_loss: 0.1020 ||:  19%|#8        | 21/111 [00:13<00:57,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8729, UAS: 0.9191, LAS: 0.8573, UEM: 0.4431, LEM: 0.1985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5818, partial_loss/deprel_loss: 0.7437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8136, loss: 0.9558, batch_reg_loss: 0.1023, reg_loss: 0.1020 ||:  22%|##1       | 24/111 [00:15<00:57,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9207, LAS: 0.8589, UEM: 0.4550, LEM: 0.2127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7988, partial_loss/deprel_loss: 0.9206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9986, loss: 0.9407, batch_reg_loss: 0.1024, reg_loss: 0.1021 ||:  25%|##5       | 28/111 [00:18<00:54,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9219, LAS: 0.8599, UEM: 0.4545, LEM: 0.2086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9907, partial_loss/deprel_loss: 0.9659, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0733, loss: 0.9309, batch_reg_loss: 0.1025, reg_loss: 0.1021 ||:  28%|##7       | 31/111 [00:20<00:53,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8286, UAS: 0.9239, LAS: 0.8630, UEM: 0.5199, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1700, partial_loss/deprel_loss: 1.1138, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2275, loss: 0.9088, batch_reg_loss: 0.1025, reg_loss: 0.1022 ||:  31%|###       | 34/111 [00:22<00:55,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9237, LAS: 0.8628, UEM: 0.5208, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3895, partial_loss/deprel_loss: 0.6072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.9085, batch_reg_loss: 0.1026, reg_loss: 0.1022 ||:  34%|###4      | 38/111 [00:25<00:50,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8645, UAS: 0.9219, LAS: 0.8612, UEM: 0.5116, LEM: 0.2786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6607, partial_loss/deprel_loss: 0.7658, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8475, loss: 0.9216, batch_reg_loss: 0.1027, reg_loss: 0.1022 ||:  38%|###7      | 42/111 [00:27<00:45,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7785, UAS: 0.9207, LAS: 0.8600, UEM: 0.5061, LEM: 0.2746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8828, partial_loss/deprel_loss: 1.4185, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6141, loss: 0.9324, batch_reg_loss: 0.1028, reg_loss: 0.1023 ||:  41%|####1     | 46/111 [00:30<00:42,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9206, LAS: 0.8598, UEM: 0.4985, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5178, partial_loss/deprel_loss: 1.2824, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4323, loss: 0.9363, batch_reg_loss: 0.1028, reg_loss: 0.1023 ||:  45%|####5     | 50/111 [00:33<00:40,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9225, LAS: 0.8620, UEM: 0.5273, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3015, partial_loss/deprel_loss: 0.4830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5496, loss: 0.9186, batch_reg_loss: 0.1029, reg_loss: 0.1024 ||:  48%|####7     | 53/111 [00:35<00:39,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8645, UAS: 0.9225, LAS: 0.8617, UEM: 0.5194, LEM: 0.2878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6157, partial_loss/deprel_loss: 0.7654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8384, loss: 0.9208, batch_reg_loss: 0.1030, reg_loss: 0.1024 ||:  50%|#####     | 56/111 [00:37<00:37,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9223, LAS: 0.8611, UEM: 0.5155, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3731, partial_loss/deprel_loss: 0.6492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6971, loss: 0.9261, batch_reg_loss: 0.1030, reg_loss: 0.1024 ||:  53%|#####3    | 59/111 [00:39<00:36,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9211, LAS: 0.8598, UEM: 0.5063, LEM: 0.2758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7221, partial_loss/deprel_loss: 0.8030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8899, loss: 0.9367, batch_reg_loss: 0.1031, reg_loss: 0.1025 ||:  56%|#####5    | 62/111 [00:41<00:33,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8357, UAS: 0.9183, LAS: 0.8566, UEM: 0.4943, LEM: 0.2676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0037, partial_loss/deprel_loss: 0.9773, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0858, loss: 0.9632, batch_reg_loss: 0.1032, reg_loss: 0.1025 ||:  59%|#####9    | 66/111 [00:44<00:30,  1.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8227, UAS: 0.9178, LAS: 0.8557, UEM: 0.4850, LEM: 0.2602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1411, partial_loss/deprel_loss: 1.1626, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2616, loss: 0.9685, batch_reg_loss: 0.1033, reg_loss: 0.1025 ||:  63%|######3   | 70/111 [00:46<00:27,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9048, UAS: 0.9189, LAS: 0.8569, UEM: 0.4977, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2746, partial_loss/deprel_loss: 0.5005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5587, loss: 0.9568, batch_reg_loss: 0.1034, reg_loss: 0.1026 ||:  67%|######6   | 74/111 [00:49<00:24,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8208, UAS: 0.9177, LAS: 0.8557, UEM: 0.4966, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6101, partial_loss/deprel_loss: 1.1479, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3438, loss: 0.9684, batch_reg_loss: 0.1035, reg_loss: 0.1026 ||:  69%|######9   | 77/111 [00:51<00:23,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9174, LAS: 0.8554, UEM: 0.4877, LEM: 0.2624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6921, partial_loss/deprel_loss: 0.7516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8433, loss: 0.9711, batch_reg_loss: 0.1036, reg_loss: 0.1027 ||:  73%|#######2  | 81/111 [00:54<00:20,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9177, LAS: 0.8554, UEM: 0.4819, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5465, partial_loss/deprel_loss: 0.7612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8219, loss: 0.9704, batch_reg_loss: 0.1036, reg_loss: 0.1027 ||:  77%|#######6  | 85/111 [00:56<00:16,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9183, LAS: 0.8559, UEM: 0.4814, LEM: 0.2532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6801, partial_loss/deprel_loss: 0.8225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8978, loss: 0.9660, batch_reg_loss: 0.1037, reg_loss: 0.1028 ||:  80%|########  | 89/111 [00:59<00:14,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8791, UAS: 0.9192, LAS: 0.8571, UEM: 0.4872, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5869, partial_loss/deprel_loss: 0.6416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7345, loss: 0.9550, batch_reg_loss: 0.1038, reg_loss: 0.1028 ||:  84%|########3 | 93/111 [01:01<00:11,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9200, LAS: 0.8581, UEM: 0.4941, LEM: 0.2628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2738, partial_loss/deprel_loss: 0.4538, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5217, loss: 0.9464, batch_reg_loss: 0.1039, reg_loss: 0.1028 ||:  87%|########7 | 97/111 [01:05<00:09,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9204, LAS: 0.8585, UEM: 0.5007, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4079, partial_loss/deprel_loss: 0.5752, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6458, loss: 0.9437, batch_reg_loss: 0.1040, reg_loss: 0.1029 ||:  91%|######### | 101/111 [01:07<00:07,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9208, LAS: 0.8587, UEM: 0.5012, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3307, partial_loss/deprel_loss: 0.5607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6188, loss: 0.9398, batch_reg_loss: 0.1041, reg_loss: 0.1029 ||:  94%|#########3| 104/111 [01:10<00:04,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9209, LAS: 0.8588, UEM: 0.4988, LEM: 0.2634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5770, partial_loss/deprel_loss: 0.6887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7704, loss: 0.9390, batch_reg_loss: 0.1041, reg_loss: 0.1030 ||:  96%|#########6| 107/111 [01:12<00:02,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7959, UAS: 0.9205, LAS: 0.8584, UEM: 0.5038, LEM: 0.2702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6188, partial_loss/deprel_loss: 1.3442, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5033, loss: 0.9428, batch_reg_loss: 0.1042, reg_loss: 0.1030 ||:  99%|#########9| 110/111 [01:14<00:00,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9208, LAS: 0.8587, UEM: 0.5047, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3658, partial_loss/deprel_loss: 0.5668, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6308, loss: 0.9400, batch_reg_loss: 0.1042, reg_loss: 0.1030 ||: 100%|##########| 111/111 [01:15<00:00,  1.48it/s]\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.567  |       N/A\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.366  |       N/A\n",
      "2023-04-06 23:22:40,312 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.103  |       N/A\n",
      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - UEM                      |     0.505  |       N/A\n",
      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - LAS                      |     0.859  |       N/A\n",
      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - loss                     |     0.940  |       N/A\n",
      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - LEM                      |     0.270  |       N/A\n",
      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - UAS                      |     0.921  |       N/A\n",
      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - EM                       |     0.892  |       N/A\n",
      "2023-04-06 23:22:40,313 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:22:40,314 - INFO - combo.training.trainer - Epoch duration: 0:01:15.208139\n",
      "2023-04-06 23:22:40,314 - INFO - combo.training.trainer - Estimated training time remaining: 8:13:15\n",
      "2023-04-06 23:22:40,314 - INFO - allennlp.training.trainer - Epoch 25/399\n",
      "2023-04-06 23:22:40,314 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:22:40,314 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:22:40,320 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9344, LAS: 0.8797, UEM: 0.4935, LEM: 0.2495, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6547, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8849, loss: 0.7391, batch_reg_loss: 0.1042, reg_loss: 0.1042 ||:   3%|2         | 3/111 [00:02<01:15,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8283, UAS: 0.9349, LAS: 0.8766, UEM: 0.4955, LEM: 0.2317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0891, partial_loss/deprel_loss: 1.0617, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1715, loss: 0.7907, batch_reg_loss: 0.1043, reg_loss: 0.1043 ||:   5%|5         | 6/111 [00:04<01:13,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8172, UAS: 0.9163, LAS: 0.8558, UEM: 0.4640, LEM: 0.2246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3905, partial_loss/deprel_loss: 1.1573, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3083, loss: 0.9494, batch_reg_loss: 0.1044, reg_loss: 0.1043 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9227, LAS: 0.8621, UEM: 0.4577, LEM: 0.2099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4299, partial_loss/deprel_loss: 0.6033, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6731, loss: 0.9065, batch_reg_loss: 0.1045, reg_loss: 0.1043 ||:  13%|#2        | 14/111 [00:09<01:05,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9247, LAS: 0.8645, UEM: 0.4702, LEM: 0.2253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6388, partial_loss/deprel_loss: 0.7764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8534, loss: 0.8863, batch_reg_loss: 0.1045, reg_loss: 0.1044 ||:  15%|#5        | 17/111 [00:11<01:07,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9276, LAS: 0.8682, UEM: 0.5241, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8834, partial_loss/deprel_loss: 0.9625, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0513, loss: 0.8611, batch_reg_loss: 0.1046, reg_loss: 0.1044 ||:  18%|#8        | 20/111 [00:14<01:05,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8113, UAS: 0.9243, LAS: 0.8644, UEM: 0.4944, LEM: 0.2741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5374, partial_loss/deprel_loss: 1.1203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3084, loss: 0.8922, batch_reg_loss: 0.1047, reg_loss: 0.1044 ||:  21%|##        | 23/111 [00:16<01:02,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9286, LAS: 0.8690, UEM: 0.5379, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3213, partial_loss/deprel_loss: 0.5448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.8552, batch_reg_loss: 0.1047, reg_loss: 0.1045 ||:  23%|##3       | 26/111 [00:18<01:00,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7784, UAS: 0.9271, LAS: 0.8676, UEM: 0.5357, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1583, partial_loss/deprel_loss: 1.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6182, loss: 0.8713, batch_reg_loss: 0.1048, reg_loss: 0.1045 ||:  27%|##7       | 30/111 [00:20<00:55,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9281, LAS: 0.8688, UEM: 0.5477, LEM: 0.3002, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3166, partial_loss/deprel_loss: 0.4624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5381, loss: 0.8613, batch_reg_loss: 0.1049, reg_loss: 0.1045 ||:  30%|##9       | 33/111 [00:22<00:53,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8912, UAS: 0.9289, LAS: 0.8693, UEM: 0.5395, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3442, partial_loss/deprel_loss: 0.6002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6539, loss: 0.8581, batch_reg_loss: 0.1049, reg_loss: 0.1046 ||:  32%|###2      | 36/111 [00:24<00:51,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8346, UAS: 0.9285, LAS: 0.8688, UEM: 0.5242, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1629, partial_loss/deprel_loss: 1.0839, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2047, loss: 0.8636, batch_reg_loss: 0.1050, reg_loss: 0.1046 ||:  36%|###6      | 40/111 [00:27<00:47,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7681, UAS: 0.9278, LAS: 0.8681, UEM: 0.5437, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1504, partial_loss/deprel_loss: 1.4375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6852, loss: 0.8681, batch_reg_loss: 0.1051, reg_loss: 0.1046 ||:  39%|###8      | 43/111 [00:29<00:48,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9259, LAS: 0.8659, UEM: 0.5305, LEM: 0.2850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6785, partial_loss/deprel_loss: 0.7163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8139, loss: 0.8856, batch_reg_loss: 0.1052, reg_loss: 0.1047 ||:  42%|####2     | 47/111 [00:32<00:43,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8641, UAS: 0.9249, LAS: 0.8648, UEM: 0.5189, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6368, partial_loss/deprel_loss: 0.7374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8225, loss: 0.8922, batch_reg_loss: 0.1052, reg_loss: 0.1047 ||:  45%|####5     | 50/111 [00:34<00:42,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9257, LAS: 0.8655, UEM: 0.5205, LEM: 0.2743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3766, partial_loss/deprel_loss: 0.6185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6754, loss: 0.8873, batch_reg_loss: 0.1053, reg_loss: 0.1047 ||:  48%|####7     | 53/111 [00:36<00:40,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9251, LAS: 0.8652, UEM: 0.5197, LEM: 0.2753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2680, partial_loss/deprel_loss: 0.4119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.8925, batch_reg_loss: 0.1054, reg_loss: 0.1048 ||:  50%|#####     | 56/111 [00:38<00:38,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8824, UAS: 0.9268, LAS: 0.8674, UEM: 0.5477, LEM: 0.3105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4947, partial_loss/deprel_loss: 0.7372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7941, loss: 0.8777, batch_reg_loss: 0.1054, reg_loss: 0.1048 ||:  53%|#####3    | 59/111 [00:41<00:39,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8073, UAS: 0.9261, LAS: 0.8666, UEM: 0.5477, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6483, partial_loss/deprel_loss: 1.1254, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3354, loss: 0.8834, batch_reg_loss: 0.1055, reg_loss: 0.1048 ||:  56%|#####5    | 62/111 [00:43<00:36,  1.33it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9259, LAS: 0.8663, UEM: 0.5460, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3969, partial_loss/deprel_loss: 0.5212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6019, loss: 0.8849, batch_reg_loss: 0.1056, reg_loss: 0.1049 ||:  59%|#####9    | 66/111 [00:46<00:32,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8236, UAS: 0.9236, LAS: 0.8636, UEM: 0.5365, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2846, partial_loss/deprel_loss: 1.1375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2725, loss: 0.9055, batch_reg_loss: 0.1056, reg_loss: 0.1049 ||:  62%|######2   | 69/111 [00:48<00:30,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8148, UAS: 0.9225, LAS: 0.8623, UEM: 0.5268, LEM: 0.2954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3223, partial_loss/deprel_loss: 1.2582, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3767, loss: 0.9208, batch_reg_loss: 0.1057, reg_loss: 0.1050 ||:  65%|######4   | 72/111 [00:50<00:27,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7637, UAS: 0.9220, LAS: 0.8616, UEM: 0.5317, LEM: 0.3009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9413, partial_loss/deprel_loss: 1.3939, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6091, loss: 0.9239, batch_reg_loss: 0.1058, reg_loss: 0.1050 ||:  68%|######7   | 75/111 [00:52<00:25,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9222, LAS: 0.8616, UEM: 0.5255, LEM: 0.2946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7652, partial_loss/deprel_loss: 0.8632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9495, loss: 0.9231, batch_reg_loss: 0.1058, reg_loss: 0.1050 ||:  70%|#######   | 78/111 [00:54<00:23,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9232, LAS: 0.8625, UEM: 0.5251, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4565, partial_loss/deprel_loss: 0.7356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7857, loss: 0.9174, batch_reg_loss: 0.1059, reg_loss: 0.1050 ||:  73%|#######2  | 81/111 [00:56<00:21,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9231, LAS: 0.8623, UEM: 0.5156, LEM: 0.2836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0232, partial_loss/deprel_loss: 1.1543, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2341, loss: 0.9186, batch_reg_loss: 0.1060, reg_loss: 0.1051 ||:  77%|#######6  | 85/111 [00:59<00:17,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9238, LAS: 0.8630, UEM: 0.5193, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2800, partial_loss/deprel_loss: 0.5071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5677, loss: 0.9128, batch_reg_loss: 0.1061, reg_loss: 0.1051 ||:  80%|########  | 89/111 [01:01<00:15,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9241, LAS: 0.8633, UEM: 0.5179, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0860, partial_loss/deprel_loss: 1.0809, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1880, loss: 0.9103, batch_reg_loss: 0.1062, reg_loss: 0.1052 ||:  83%|########2 | 92/111 [01:04<00:13,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8234, UAS: 0.9244, LAS: 0.8636, UEM: 0.5232, LEM: 0.2852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2385, partial_loss/deprel_loss: 1.0176, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1680, loss: 0.9053, batch_reg_loss: 0.1062, reg_loss: 0.1052 ||:  86%|########6 | 96/111 [01:06<00:10,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9233, LAS: 0.8623, UEM: 0.5169, LEM: 0.2813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8967, partial_loss/deprel_loss: 0.9467, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0430, loss: 0.9148, batch_reg_loss: 0.1063, reg_loss: 0.1052 ||:  89%|########9 | 99/111 [01:08<00:08,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9238, LAS: 0.8630, UEM: 0.5188, LEM: 0.2829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3748, partial_loss/deprel_loss: 0.5105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5897, loss: 0.9090, batch_reg_loss: 0.1064, reg_loss: 0.1053 ||:  92%|#########1| 102/111 [01:11<00:06,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9231, LAS: 0.8623, UEM: 0.5110, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7957, partial_loss/deprel_loss: 0.8864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9747, loss: 0.9154, batch_reg_loss: 0.1064, reg_loss: 0.1053 ||:  95%|#########5| 106/111 [01:14<00:03,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7423, UAS: 0.9219, LAS: 0.8609, UEM: 0.5056, LEM: 0.2734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.8168, partial_loss/deprel_loss: 1.8275, partial_loss/cycle_loss: 0.0000, batch_loss: 2.1319, loss: 0.9278, batch_reg_loss: 0.1065, reg_loss: 0.1054 ||:  99%|#########9| 110/111 [01:16<00:00,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9221, LAS: 0.8612, UEM: 0.5086, LEM: 0.2752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3234, partial_loss/deprel_loss: 0.5511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6121, loss: 0.9250, batch_reg_loss: 0.1065, reg_loss: 0.1054 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
      "2023-04-06 23:23:58,213 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9630, LAS: 0.9177, UEM: 0.8159, LEM: 0.5815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1737, partial_loss/deprel_loss: 20.5474, partial_loss/cycle_loss: 0.0000, batch_loss: 16.4726, loss: 21.0144, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.11it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9472, LAS: 0.8955, UEM: 0.7141, LEM: 0.4812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0153, partial_loss/deprel_loss: 43.3811, partial_loss/cycle_loss: 0.0000, batch_loss: 34.9080, loss: 25.5731, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:07,  1.05it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9444, LAS: 0.8901, UEM: 0.6600, LEM: 0.4105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7415, partial_loss/deprel_loss: 29.8373, partial_loss/cycle_loss: 0.0000, batch_loss: 24.0182, loss: 24.7509, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.06it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9442, LAS: 0.8901, UEM: 0.6403, LEM: 0.3835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3994, partial_loss/deprel_loss: 17.6347, partial_loss/cycle_loss: 0.0000, batch_loss: 14.1877, loss: 24.6526, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.06it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9410, LAS: 0.8860, UEM: 0.6232, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3976, partial_loss/deprel_loss: 24.4861, partial_loss/cycle_loss: 0.0000, batch_loss: 19.6684, loss: 25.9867, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.06it/s]\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.551  |    24.486\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.323  |     0.398\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.105  |     0.000\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - UEM                      |     0.509  |     0.623\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - LAS                      |     0.861  |     0.886\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - loss                     |     0.925  |    25.987\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:24:10,534 - INFO - combo.training.tensorboard_writer - LEM                      |     0.275  |     0.362\n",
      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - UAS                      |     0.922  |     0.941\n",
      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - EM                       |     0.893  |     0.904\n",
      "2023-04-06 23:24:10,535 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:24:10,535 - INFO - combo.training.trainer - Epoch duration: 0:01:30.221589\n",
      "2023-04-06 23:24:10,535 - INFO - combo.training.trainer - Estimated training time remaining: 8:14:38\n",
      "2023-04-06 23:24:10,536 - INFO - allennlp.training.trainer - Epoch 26/399\n",
      "2023-04-06 23:24:10,536 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:24:10,536 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:24:10,542 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9545, LAS: 0.9014, UEM: 0.6867, LEM: 0.3821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3364, partial_loss/deprel_loss: 0.5464, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.6380, batch_reg_loss: 0.1066, reg_loss: 0.1066 ||:   3%|2         | 3/111 [00:02<01:20,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8532, UAS: 0.9292, LAS: 0.8709, UEM: 0.5445, LEM: 0.2801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7835, partial_loss/deprel_loss: 0.8604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9517, loss: 0.8619, batch_reg_loss: 0.1067, reg_loss: 0.1066 ||:   6%|6         | 7/111 [00:04<01:14,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9296, LAS: 0.8722, UEM: 0.6059, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1357, partial_loss/deprel_loss: 0.2700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3499, loss: 0.8487, batch_reg_loss: 0.1068, reg_loss: 0.1067 ||:   9%|9         | 10/111 [00:07<01:14,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8605, UAS: 0.9257, LAS: 0.8661, UEM: 0.5670, LEM: 0.3431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8304, partial_loss/deprel_loss: 0.8325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9389, loss: 0.8925, batch_reg_loss: 0.1068, reg_loss: 0.1067 ||:  13%|#2        | 14/111 [00:09<01:07,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9232, LAS: 0.8619, UEM: 0.5243, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5089, partial_loss/deprel_loss: 0.7516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8100, loss: 0.9244, batch_reg_loss: 0.1069, reg_loss: 0.1068 ||:  16%|#6        | 18/111 [00:11<01:01,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8921, UAS: 0.9243, LAS: 0.8631, UEM: 0.5139, LEM: 0.2889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3767, partial_loss/deprel_loss: 0.5236, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.9069, batch_reg_loss: 0.1070, reg_loss: 0.1068 ||:  19%|#8        | 21/111 [00:14<01:02,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9241, LAS: 0.8641, UEM: 0.5164, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2933, partial_loss/deprel_loss: 0.4944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5612, loss: 0.9046, batch_reg_loss: 0.1071, reg_loss: 0.1068 ||:  23%|##2       | 25/111 [00:16<00:57,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9258, LAS: 0.8660, UEM: 0.5084, LEM: 0.2739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4166, partial_loss/deprel_loss: 0.6166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6837, loss: 0.8859, batch_reg_loss: 0.1072, reg_loss: 0.1069 ||:  26%|##6       | 29/111 [00:19<00:55,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9258, LAS: 0.8655, UEM: 0.5043, LEM: 0.2665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2740, partial_loss/deprel_loss: 0.5245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5816, loss: 0.8904, batch_reg_loss: 0.1073, reg_loss: 0.1069 ||:  30%|##9       | 33/111 [00:21<00:51,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9282, LAS: 0.8682, UEM: 0.5457, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1732, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4990, loss: 0.8672, batch_reg_loss: 0.1073, reg_loss: 0.1069 ||:  32%|###2      | 36/111 [00:23<00:49,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9276, LAS: 0.8675, UEM: 0.5649, LEM: 0.3241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3104, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5757, loss: 0.8686, batch_reg_loss: 0.1074, reg_loss: 0.1070 ||:  35%|###5      | 39/111 [00:26<00:48,  1.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9282, LAS: 0.8683, UEM: 0.5682, LEM: 0.3254, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2328, partial_loss/deprel_loss: 0.4289, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4971, loss: 0.8663, batch_reg_loss: 0.1075, reg_loss: 0.1070 ||:  39%|###8      | 43/111 [00:28<00:44,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9305, LAS: 0.8712, UEM: 0.5994, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3668, partial_loss/deprel_loss: 0.6581, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7074, loss: 0.8445, batch_reg_loss: 0.1075, reg_loss: 0.1071 ||:  42%|####2     | 47/111 [00:31<00:42,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8464, UAS: 0.9285, LAS: 0.8689, UEM: 0.5846, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8792, partial_loss/deprel_loss: 0.9102, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0116, loss: 0.8637, batch_reg_loss: 0.1076, reg_loss: 0.1071 ||:  46%|####5     | 51/111 [00:33<00:39,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9282, LAS: 0.8684, UEM: 0.5741, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4152, partial_loss/deprel_loss: 0.6219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6883, loss: 0.8696, batch_reg_loss: 0.1077, reg_loss: 0.1071 ||:  50%|####9     | 55/111 [00:36<00:36,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9289, LAS: 0.8689, UEM: 0.5806, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3748, partial_loss/deprel_loss: 0.6606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7112, loss: 0.8649, batch_reg_loss: 0.1078, reg_loss: 0.1072 ||:  53%|#####3    | 59/111 [00:39<00:35,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8305, UAS: 0.9287, LAS: 0.8687, UEM: 0.5776, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1911, partial_loss/deprel_loss: 1.0662, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1991, loss: 0.8640, batch_reg_loss: 0.1078, reg_loss: 0.1072 ||:  56%|#####5    | 62/111 [00:41<00:34,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9283, LAS: 0.8684, UEM: 0.5685, LEM: 0.3305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0422, partial_loss/deprel_loss: 0.9557, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0810, loss: 0.8660, batch_reg_loss: 0.1079, reg_loss: 0.1073 ||:  59%|#####9    | 66/111 [00:43<00:30,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9273, LAS: 0.8673, UEM: 0.5602, LEM: 0.3234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4067, partial_loss/deprel_loss: 0.6749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7293, loss: 0.8741, batch_reg_loss: 0.1080, reg_loss: 0.1073 ||:  63%|######3   | 70/111 [00:46<00:27,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9263, LAS: 0.8659, UEM: 0.5479, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7849, partial_loss/deprel_loss: 0.7782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8876, loss: 0.8835, batch_reg_loss: 0.1081, reg_loss: 0.1073 ||:  67%|######6   | 74/111 [00:48<00:23,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9263, LAS: 0.8660, UEM: 0.5435, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8610, partial_loss/deprel_loss: 0.9041, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0036, loss: 0.8832, batch_reg_loss: 0.1082, reg_loss: 0.1074 ||:  70%|#######   | 78/111 [00:51<00:21,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9239, LAS: 0.8632, UEM: 0.5339, LEM: 0.3026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0083, partial_loss/deprel_loss: 0.9057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0345, loss: 0.9074, batch_reg_loss: 0.1083, reg_loss: 0.1074 ||:  74%|#######3  | 82/111 [00:54<00:19,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9232, LAS: 0.8625, UEM: 0.5256, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4858, partial_loss/deprel_loss: 0.6129, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6958, loss: 0.9146, batch_reg_loss: 0.1083, reg_loss: 0.1075 ||:  77%|#######7  | 86/111 [00:57<00:16,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8379, UAS: 0.9209, LAS: 0.8601, UEM: 0.5163, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1256, partial_loss/deprel_loss: 0.9807, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1181, loss: 0.9341, batch_reg_loss: 0.1084, reg_loss: 0.1075 ||:  81%|########1 | 90/111 [00:59<00:14,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9218, LAS: 0.8611, UEM: 0.5218, LEM: 0.2919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3100, partial_loss/deprel_loss: 0.5110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5793, loss: 0.9257, batch_reg_loss: 0.1085, reg_loss: 0.1075 ||:  84%|########3 | 93/111 [01:02<00:12,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8807, UAS: 0.9222, LAS: 0.8613, UEM: 0.5183, LEM: 0.2878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5588, partial_loss/deprel_loss: 0.6559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7451, loss: 0.9237, batch_reg_loss: 0.1086, reg_loss: 0.1076 ||:  86%|########6 | 96/111 [01:04<00:10,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8350, UAS: 0.9224, LAS: 0.8615, UEM: 0.5172, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0468, partial_loss/deprel_loss: 1.0077, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1242, loss: 0.9211, batch_reg_loss: 0.1087, reg_loss: 0.1076 ||:  90%|######### | 100/111 [01:06<00:07,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9214, LAS: 0.8605, UEM: 0.5132, LEM: 0.2837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4873, partial_loss/deprel_loss: 0.6853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7544, loss: 0.9311, batch_reg_loss: 0.1087, reg_loss: 0.1076 ||:  93%|#########2| 103/111 [01:08<00:05,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9221, LAS: 0.8612, UEM: 0.5180, LEM: 0.2852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7112, partial_loss/deprel_loss: 0.8132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9016, loss: 0.9247, batch_reg_loss: 0.1088, reg_loss: 0.1077 ||:  95%|#########5| 106/111 [01:11<00:03,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9214, LAS: 0.8602, UEM: 0.5101, LEM: 0.2792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2259, partial_loss/deprel_loss: 1.2003, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3143, loss: 0.9326, batch_reg_loss: 0.1089, reg_loss: 0.1077 ||:  99%|#########9| 110/111 [01:13<00:00,  1.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9217, LAS: 0.8605, UEM: 0.5109, LEM: 0.2788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3606, partial_loss/deprel_loss: 0.6149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6730, loss: 0.9302, batch_reg_loss: 0.1089, reg_loss: 0.1077 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
      "2023-04-06 23:25:25,100 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.615  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.361  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.108  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - UEM                      |     0.511  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - LAS                      |     0.861  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - loss                     |     0.930  |       N/A\n",
      "2023-04-06 23:25:25,101 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - LEM                      |     0.279  |       N/A\n",
      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - UAS                      |     0.922  |       N/A\n",
      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - EM                       |     0.898  |       N/A\n",
      "2023-04-06 23:25:25,102 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:25:25,102 - INFO - combo.training.trainer - Epoch duration: 0:01:14.566974\n",
      "2023-04-06 23:25:25,103 - INFO - combo.training.trainer - Estimated training time remaining: 8:12:13\n",
      "2023-04-06 23:25:25,103 - INFO - allennlp.training.trainer - Epoch 27/399\n",
      "2023-04-06 23:25:25,103 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:25:25,103 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:25:25,110 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8523, UAS: 0.9369, LAS: 0.8747, UEM: 0.5058, LEM: 0.2442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8675, partial_loss/deprel_loss: 1.0086, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0894, loss: 0.8187, batch_reg_loss: 0.1090, reg_loss: 0.1090 ||:   4%|3         | 4/111 [00:02<01:07,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9336, LAS: 0.8740, UEM: 0.5125, LEM: 0.2599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3637, partial_loss/deprel_loss: 0.5490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6210, loss: 0.8310, batch_reg_loss: 0.1091, reg_loss: 0.1090 ||:   7%|7         | 8/111 [00:05<01:06,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8245, UAS: 0.9243, LAS: 0.8646, UEM: 0.5087, LEM: 0.2633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3445, partial_loss/deprel_loss: 1.1262, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2790, loss: 0.9138, batch_reg_loss: 0.1091, reg_loss: 0.1090 ||:  10%|9         | 11/111 [00:07<01:06,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8379, UAS: 0.9269, LAS: 0.8667, UEM: 0.5467, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8799, partial_loss/deprel_loss: 1.0002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0854, loss: 0.8886, batch_reg_loss: 0.1092, reg_loss: 0.1091 ||:  13%|#2        | 14/111 [00:09<01:05,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9294, LAS: 0.8700, UEM: 0.5552, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3805, partial_loss/deprel_loss: 0.5957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6619, loss: 0.8598, batch_reg_loss: 0.1093, reg_loss: 0.1091 ||:  15%|#5        | 17/111 [00:11<01:03,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9265, LAS: 0.8674, UEM: 0.5617, LEM: 0.3090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5139, loss: 0.8870, batch_reg_loss: 0.1093, reg_loss: 0.1091 ||:  19%|#8        | 21/111 [00:14<01:01,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8317, UAS: 0.9271, LAS: 0.8678, UEM: 0.5447, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1042, partial_loss/deprel_loss: 0.9767, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1116, loss: 0.8804, batch_reg_loss: 0.1094, reg_loss: 0.1092 ||:  23%|##2       | 25/111 [00:16<00:55,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9287, LAS: 0.8691, UEM: 0.5503, LEM: 0.3007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5186, partial_loss/deprel_loss: 0.7539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8163, loss: 0.8661, batch_reg_loss: 0.1095, reg_loss: 0.1092 ||:  26%|##6       | 29/111 [00:19<00:52,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9292, LAS: 0.8690, UEM: 0.5347, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6542, partial_loss/deprel_loss: 0.8093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8878, loss: 0.8647, batch_reg_loss: 0.1096, reg_loss: 0.1093 ||:  30%|##9       | 33/111 [00:21<00:49,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7760, UAS: 0.9264, LAS: 0.8662, UEM: 0.5149, LEM: 0.2670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9272, partial_loss/deprel_loss: 1.4164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6282, loss: 0.8847, batch_reg_loss: 0.1097, reg_loss: 0.1093 ||:  33%|###3      | 37/111 [00:24<00:46,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9237, LAS: 0.8637, UEM: 0.5148, LEM: 0.2693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4669, partial_loss/deprel_loss: 1.0744, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2626, loss: 0.9017, batch_reg_loss: 0.1097, reg_loss: 0.1093 ||:  37%|###6      | 41/111 [00:27<00:47,  1.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9233, LAS: 0.8630, UEM: 0.5048, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5881, partial_loss/deprel_loss: 0.7383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8181, loss: 0.9055, batch_reg_loss: 0.1098, reg_loss: 0.1094 ||:  41%|####      | 45/111 [00:29<00:43,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9229, LAS: 0.8620, UEM: 0.4906, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1077, partial_loss/deprel_loss: 1.0868, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2009, loss: 0.9135, batch_reg_loss: 0.1099, reg_loss: 0.1094 ||:  44%|####4     | 49/111 [00:32<00:42,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8291, UAS: 0.9227, LAS: 0.8618, UEM: 0.4889, LEM: 0.2509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1882, partial_loss/deprel_loss: 1.1634, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2784, loss: 0.9169, batch_reg_loss: 0.1100, reg_loss: 0.1095 ||:  48%|####7     | 53/111 [00:35<00:38,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9214, LAS: 0.8604, UEM: 0.5006, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1371, partial_loss/deprel_loss: 0.2988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3766, loss: 0.9293, batch_reg_loss: 0.1101, reg_loss: 0.1095 ||:  51%|#####1    | 57/111 [00:37<00:35,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8270, UAS: 0.9216, LAS: 0.8607, UEM: 0.4967, LEM: 0.2637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3575, partial_loss/deprel_loss: 1.1842, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3291, loss: 0.9275, batch_reg_loss: 0.1102, reg_loss: 0.1095 ||:  55%|#####4    | 61/111 [00:40<00:33,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9224, LAS: 0.8614, UEM: 0.4990, LEM: 0.2618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3941, partial_loss/deprel_loss: 0.6425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7031, loss: 0.9222, batch_reg_loss: 0.1103, reg_loss: 0.1096 ||:  59%|#####8    | 65/111 [00:43<00:31,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9221, LAS: 0.8608, UEM: 0.4882, LEM: 0.2540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5820, partial_loss/deprel_loss: 0.7200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8027, loss: 0.9284, batch_reg_loss: 0.1104, reg_loss: 0.1096 ||:  62%|######2   | 69/111 [00:45<00:27,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7939, UAS: 0.9217, LAS: 0.8602, UEM: 0.4867, LEM: 0.2522, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4043, partial_loss/deprel_loss: 1.2781, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4138, loss: 0.9343, batch_reg_loss: 0.1105, reg_loss: 0.1097 ||:  66%|######5   | 73/111 [00:48<00:25,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9218, LAS: 0.8604, UEM: 0.4876, LEM: 0.2539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1732, partial_loss/deprel_loss: 1.1097, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2329, loss: 0.9349, batch_reg_loss: 0.1105, reg_loss: 0.1097 ||:  68%|######8   | 76/111 [00:50<00:23,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7630, UAS: 0.9204, LAS: 0.8589, UEM: 0.4799, LEM: 0.2490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.3397, partial_loss/deprel_loss: 1.4709, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7552, loss: 0.9468, batch_reg_loss: 0.1106, reg_loss: 0.1098 ||:  72%|#######2  | 80/111 [00:53<00:20,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9212, LAS: 0.8595, UEM: 0.4774, LEM: 0.2459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4129, partial_loss/deprel_loss: 0.5541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6366, loss: 0.9420, batch_reg_loss: 0.1107, reg_loss: 0.1098 ||:  76%|#######5  | 84/111 [00:55<00:17,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9211, LAS: 0.8593, UEM: 0.4725, LEM: 0.2413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4724, partial_loss/deprel_loss: 0.6431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7198, loss: 0.9422, batch_reg_loss: 0.1108, reg_loss: 0.1098 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9214, LAS: 0.8598, UEM: 0.4746, LEM: 0.2414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3605, partial_loss/deprel_loss: 0.5323, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6088, loss: 0.9386, batch_reg_loss: 0.1109, reg_loss: 0.1099 ||:  83%|########2 | 92/111 [01:00<00:12,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9217, LAS: 0.8601, UEM: 0.4750, LEM: 0.2411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2847, partial_loss/deprel_loss: 0.5046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5715, loss: 0.9359, batch_reg_loss: 0.1109, reg_loss: 0.1099 ||:  86%|########6 | 96/111 [01:03<00:09,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9220, LAS: 0.8605, UEM: 0.4788, LEM: 0.2450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5046, loss: 0.9335, batch_reg_loss: 0.1110, reg_loss: 0.1100 ||:  90%|######### | 100/111 [01:05<00:07,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9226, LAS: 0.8612, UEM: 0.4877, LEM: 0.2515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1806, partial_loss/deprel_loss: 0.4301, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4913, loss: 0.9288, batch_reg_loss: 0.1111, reg_loss: 0.1100 ||:  94%|#########3| 104/111 [01:08<00:04,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9225, LAS: 0.8610, UEM: 0.4866, LEM: 0.2516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6775, partial_loss/deprel_loss: 0.9319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9922, loss: 0.9303, batch_reg_loss: 0.1112, reg_loss: 0.1101 ||:  97%|#########7| 108/111 [01:11<00:02,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9236, LAS: 0.8623, UEM: 0.5071, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0673, partial_loss/deprel_loss: 0.2098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2925, loss: 0.9200, batch_reg_loss: 0.1112, reg_loss: 0.1101 ||: 100%|##########| 111/111 [01:14<00:00,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9236, LAS: 0.8623, UEM: 0.5071, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0673, partial_loss/deprel_loss: 0.2098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2925, loss: 0.9200, batch_reg_loss: 0.1112, reg_loss: 0.1101 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
      "2023-04-06 23:26:39,190 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:26:39,190 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:26:39,190 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.210  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.067  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.110  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - UEM                      |     0.507  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - LAS                      |     0.862  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - loss                     |     0.920  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - LEM                      |     0.275  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:26:39,191 - INFO - combo.training.tensorboard_writer - UAS                      |     0.924  |       N/A\n",
      "2023-04-06 23:26:39,192 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:26:39,192 - INFO - combo.training.tensorboard_writer - EM                       |     0.949  |       N/A\n",
      "2023-04-06 23:26:39,192 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:26:39,192 - INFO - combo.training.trainer - Epoch duration: 0:01:14.089580\n",
      "2023-04-06 23:26:39,192 - INFO - combo.training.trainer - Estimated training time remaining: 8:09:46\n",
      "2023-04-06 23:26:39,192 - INFO - allennlp.training.trainer - Epoch 28/399\n",
      "2023-04-06 23:26:39,193 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:26:39,193 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:26:39,200 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9165, LAS: 0.8582, UEM: 0.6021, LEM: 0.3938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2068, partial_loss/deprel_loss: 0.4027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4748, loss: 0.9632, batch_reg_loss: 0.1113, reg_loss: 0.1113 ||:   3%|2         | 3/111 [00:02<01:20,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8479, UAS: 0.9296, LAS: 0.8705, UEM: 0.5821, LEM: 0.3469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8214, partial_loss/deprel_loss: 1.0063, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0807, loss: 0.8797, batch_reg_loss: 0.1114, reg_loss: 0.1113 ||:   5%|5         | 6/111 [00:04<01:16,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9309, LAS: 0.8722, UEM: 0.5280, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8053, partial_loss/deprel_loss: 0.8538, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9555, loss: 0.8659, batch_reg_loss: 0.1114, reg_loss: 0.1113 ||:   8%|8         | 9/111 [00:06<01:14,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9298, LAS: 0.8711, UEM: 0.5151, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4062, partial_loss/deprel_loss: 0.5566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6380, loss: 0.8682, batch_reg_loss: 0.1115, reg_loss: 0.1114 ||:  12%|#1        | 13/111 [00:09<01:09,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9512, UAS: 0.9341, LAS: 0.8772, UEM: 0.6051, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0950, partial_loss/deprel_loss: 0.1922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2843, loss: 0.8222, batch_reg_loss: 0.1115, reg_loss: 0.1114 ||:  14%|#4        | 16/111 [00:11<01:08,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9353, LAS: 0.8781, UEM: 0.5912, LEM: 0.3662, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3400, partial_loss/deprel_loss: 0.5233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5982, loss: 0.8082, batch_reg_loss: 0.1116, reg_loss: 0.1114 ||:  17%|#7        | 19/111 [00:13<01:06,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8460, UAS: 0.9338, LAS: 0.8764, UEM: 0.5584, LEM: 0.3338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8651, partial_loss/deprel_loss: 0.8871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9944, loss: 0.8188, batch_reg_loss: 0.1117, reg_loss: 0.1115 ||:  21%|##        | 23/111 [00:16<01:00,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9357, LAS: 0.8784, UEM: 0.5772, LEM: 0.3459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1911, partial_loss/deprel_loss: 0.4073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4758, loss: 0.7985, batch_reg_loss: 0.1117, reg_loss: 0.1115 ||:  23%|##3       | 26/111 [00:18<01:00,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9333, LAS: 0.8759, UEM: 0.5707, LEM: 0.3427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0747, partial_loss/deprel_loss: 0.9027, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0489, loss: 0.8142, batch_reg_loss: 0.1118, reg_loss: 0.1115 ||:  26%|##6       | 29/111 [00:20<00:58,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8281, UAS: 0.9316, LAS: 0.8740, UEM: 0.5647, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2179, partial_loss/deprel_loss: 1.0295, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1790, loss: 0.8310, batch_reg_loss: 0.1118, reg_loss: 0.1116 ||:  29%|##8       | 32/111 [00:22<00:58,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9268, LAS: 0.8688, UEM: 0.5456, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0683, partial_loss/deprel_loss: 0.9735, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1044, loss: 0.8689, batch_reg_loss: 0.1119, reg_loss: 0.1116 ||:  32%|###1      | 35/111 [00:25<00:56,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9256, LAS: 0.8672, UEM: 0.5327, LEM: 0.3104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3730, partial_loss/deprel_loss: 0.5946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6623, loss: 0.8821, batch_reg_loss: 0.1120, reg_loss: 0.1116 ||:  35%|###5      | 39/111 [00:27<00:49,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9262, LAS: 0.8679, UEM: 0.5237, LEM: 0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4640, partial_loss/deprel_loss: 0.6099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6928, loss: 0.8753, batch_reg_loss: 0.1121, reg_loss: 0.1117 ||:  39%|###8      | 43/111 [00:30<00:46,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8842, UAS: 0.9260, LAS: 0.8675, UEM: 0.5286, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5349, partial_loss/deprel_loss: 0.5833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6858, loss: 0.8760, batch_reg_loss: 0.1122, reg_loss: 0.1117 ||:  42%|####2     | 47/111 [00:32<00:42,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.9248, LAS: 0.8660, UEM: 0.5233, LEM: 0.2962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2239, partial_loss/deprel_loss: 1.0366, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1863, loss: 0.8865, batch_reg_loss: 0.1123, reg_loss: 0.1117 ||:  46%|####5     | 51/111 [00:35<00:40,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9241, LAS: 0.8651, UEM: 0.5362, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4257, partial_loss/deprel_loss: 0.6319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7030, loss: 0.8954, batch_reg_loss: 0.1123, reg_loss: 0.1118 ||:  49%|####8     | 54/111 [00:37<00:40,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9245, LAS: 0.8652, UEM: 0.5354, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3021, partial_loss/deprel_loss: 0.5010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5736, loss: 0.8952, batch_reg_loss: 0.1124, reg_loss: 0.1118 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9239, LAS: 0.8643, UEM: 0.5229, LEM: 0.2924, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0378, partial_loss/deprel_loss: 1.0526, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1621, loss: 0.9046, batch_reg_loss: 0.1125, reg_loss: 0.1118 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8561, UAS: 0.9243, LAS: 0.8646, UEM: 0.5144, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8400, partial_loss/deprel_loss: 0.8978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9988, loss: 0.9017, batch_reg_loss: 0.1125, reg_loss: 0.1119 ||:  58%|#####7    | 64/111 [00:44<00:31,  1.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9241, LAS: 0.8643, UEM: 0.5133, LEM: 0.2813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3304, partial_loss/deprel_loss: 0.5270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6003, loss: 0.9049, batch_reg_loss: 0.1126, reg_loss: 0.1119 ||:  61%|######1   | 68/111 [00:47<00:29,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9236, LAS: 0.8637, UEM: 0.5139, LEM: 0.2831, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3526, partial_loss/deprel_loss: 0.4551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5473, loss: 0.9107, batch_reg_loss: 0.1127, reg_loss: 0.1120 ||:  64%|######3   | 71/111 [00:49<00:27,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8335, UAS: 0.9230, LAS: 0.8629, UEM: 0.5046, LEM: 0.2758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1078, partial_loss/deprel_loss: 1.0005, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1347, loss: 0.9176, batch_reg_loss: 0.1128, reg_loss: 0.1120 ||:  68%|######7   | 75/111 [00:51<00:23,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9228, LAS: 0.8627, UEM: 0.5046, LEM: 0.2741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3583, partial_loss/deprel_loss: 0.5200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6006, loss: 0.9189, batch_reg_loss: 0.1129, reg_loss: 0.1120 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9231, LAS: 0.8629, UEM: 0.4983, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7399, partial_loss/deprel_loss: 0.8801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9650, loss: 0.9165, batch_reg_loss: 0.1130, reg_loss: 0.1121 ||:  75%|#######4  | 83/111 [00:56<00:17,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9215, LAS: 0.8608, UEM: 0.4888, LEM: 0.2624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8571, partial_loss/deprel_loss: 0.8282, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9470, loss: 0.9335, batch_reg_loss: 0.1131, reg_loss: 0.1121 ||:  78%|#######8  | 87/111 [00:59<00:15,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9220, LAS: 0.8617, UEM: 0.4992, LEM: 0.2722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3817, partial_loss/deprel_loss: 0.4937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5845, loss: 0.9263, batch_reg_loss: 0.1131, reg_loss: 0.1122 ||:  82%|########1 | 91/111 [01:02<00:13,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9226, LAS: 0.8625, UEM: 0.5122, LEM: 0.2863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7510, partial_loss/deprel_loss: 0.7480, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8618, loss: 0.9195, batch_reg_loss: 0.1132, reg_loss: 0.1122 ||:  86%|########5 | 95/111 [01:04<00:10,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9221, LAS: 0.8619, UEM: 0.5084, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4955, partial_loss/deprel_loss: 0.6987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7713, loss: 0.9258, batch_reg_loss: 0.1133, reg_loss: 0.1122 ||:  88%|########8 | 98/111 [01:07<00:08,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9228, LAS: 0.8628, UEM: 0.5095, LEM: 0.2814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4700, partial_loss/deprel_loss: 0.6280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7098, loss: 0.9194, batch_reg_loss: 0.1134, reg_loss: 0.1123 ||:  91%|######### | 101/111 [01:09<00:07,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9230, LAS: 0.8630, UEM: 0.5087, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.6215, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6894, loss: 0.9173, batch_reg_loss: 0.1134, reg_loss: 0.1123 ||:  94%|#########3| 104/111 [01:11<00:05,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9233, LAS: 0.8633, UEM: 0.5091, LEM: 0.2789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6688, partial_loss/deprel_loss: 0.7718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8647, loss: 0.9148, batch_reg_loss: 0.1135, reg_loss: 0.1123 ||:  96%|#########6| 107/111 [01:13<00:02,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8285, UAS: 0.9229, LAS: 0.8628, UEM: 0.5057, LEM: 0.2769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1495, partial_loss/deprel_loss: 1.0547, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1872, loss: 0.9196, batch_reg_loss: 0.1136, reg_loss: 0.1124 ||: 100%|##########| 111/111 [01:16<00:00,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8285, UAS: 0.9229, LAS: 0.8628, UEM: 0.5057, LEM: 0.2769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1495, partial_loss/deprel_loss: 1.0547, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1872, loss: 0.9196, batch_reg_loss: 0.1136, reg_loss: 0.1124 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.055  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.150  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.112  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - UEM                      |     0.506  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - LAS                      |     0.863  |       N/A\n",
      "2023-04-06 23:27:55,558 - INFO - combo.training.tensorboard_writer - loss                     |     0.920  |       N/A\n",
      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - LEM                      |     0.277  |       N/A\n",
      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - UAS                      |     0.923  |       N/A\n",
      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - EM                       |     0.829  |       N/A\n",
      "2023-04-06 23:27:55,559 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:27:55,560 - INFO - combo.training.trainer - Epoch duration: 0:01:16.367015\n",
      "2023-04-06 23:27:55,560 - INFO - combo.training.trainer - Estimated training time remaining: 8:07:53\n",
      "2023-04-06 23:27:55,560 - INFO - allennlp.training.trainer - Epoch 29/399\n",
      "2023-04-06 23:27:55,560 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:27:55,560 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:27:55,567 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9484, LAS: 0.8952, UEM: 0.6497, LEM: 0.3616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3046, partial_loss/deprel_loss: 0.4306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5190, loss: 0.6486, batch_reg_loss: 0.1136, reg_loss: 0.1136 ||:   3%|2         | 3/111 [00:02<01:22,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8304, UAS: 0.9318, LAS: 0.8774, UEM: 0.5448, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2572, partial_loss/deprel_loss: 1.0995, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2447, loss: 0.8080, batch_reg_loss: 0.1137, reg_loss: 0.1136 ||:   5%|5         | 6/111 [00:04<01:20,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.9304, LAS: 0.8744, UEM: 0.4970, LEM: 0.2492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9037, partial_loss/deprel_loss: 0.8621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9842, loss: 0.8255, batch_reg_loss: 0.1138, reg_loss: 0.1137 ||:   8%|8         | 9/111 [00:06<01:16,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8404, UAS: 0.9234, LAS: 0.8670, UEM: 0.5124, LEM: 0.2688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1069, partial_loss/deprel_loss: 1.0057, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1398, loss: 0.8843, batch_reg_loss: 0.1138, reg_loss: 0.1137 ||:  11%|#         | 12/111 [00:09<01:14,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9279, LAS: 0.8722, UEM: 0.5277, LEM: 0.2683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5707, partial_loss/deprel_loss: 0.5580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6744, loss: 0.8422, batch_reg_loss: 0.1139, reg_loss: 0.1137 ||:  14%|#3        | 15/111 [00:11<01:10,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9297, LAS: 0.8731, UEM: 0.5152, LEM: 0.2573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8735, partial_loss/deprel_loss: 0.9656, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0611, loss: 0.8408, batch_reg_loss: 0.1139, reg_loss: 0.1138 ||:  16%|#6        | 18/111 [00:13<01:07,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8382, UAS: 0.9254, LAS: 0.8680, UEM: 0.4779, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1899, partial_loss/deprel_loss: 0.9413, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.8777, batch_reg_loss: 0.1140, reg_loss: 0.1138 ||:  20%|#9        | 22/111 [00:15<01:00,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9271, LAS: 0.8695, UEM: 0.4928, LEM: 0.2473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1706, partial_loss/deprel_loss: 0.4245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.8677, batch_reg_loss: 0.1141, reg_loss: 0.1138 ||:  23%|##3       | 26/111 [00:18<00:56,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9297, LAS: 0.8723, UEM: 0.5254, LEM: 0.2732, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3101, partial_loss/deprel_loss: 0.5013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5773, loss: 0.8417, batch_reg_loss: 0.1142, reg_loss: 0.1139 ||:  26%|##6       | 29/111 [00:20<00:57,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9264, LAS: 0.8679, UEM: 0.4938, LEM: 0.2548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9940, partial_loss/deprel_loss: 0.9541, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0763, loss: 0.8794, batch_reg_loss: 0.1143, reg_loss: 0.1139 ||:  30%|##9       | 33/111 [00:22<00:52,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9259, LAS: 0.8670, UEM: 0.4878, LEM: 0.2516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3425, partial_loss/deprel_loss: 0.5836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6497, loss: 0.8870, batch_reg_loss: 0.1143, reg_loss: 0.1140 ||:  32%|###2      | 36/111 [00:25<00:51,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8347, UAS: 0.9254, LAS: 0.8666, UEM: 0.4828, LEM: 0.2487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2760, partial_loss/deprel_loss: 1.0077, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1758, loss: 0.8918, batch_reg_loss: 0.1144, reg_loss: 0.1140 ||:  35%|###5      | 39/111 [00:27<00:50,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9239, LAS: 0.8647, UEM: 0.4670, LEM: 0.2391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2418, partial_loss/deprel_loss: 0.9941, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1581, loss: 0.9075, batch_reg_loss: 0.1144, reg_loss: 0.1140 ||:  38%|###7      | 42/111 [00:29<00:48,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9235, LAS: 0.8640, UEM: 0.4682, LEM: 0.2383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3704, partial_loss/deprel_loss: 0.5971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6663, loss: 0.9136, batch_reg_loss: 0.1145, reg_loss: 0.1140 ||:  41%|####      | 45/111 [00:31<00:47,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8413, UAS: 0.9244, LAS: 0.8653, UEM: 0.4755, LEM: 0.2426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0601, partial_loss/deprel_loss: 1.0311, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1515, loss: 0.9071, batch_reg_loss: 0.1146, reg_loss: 0.1141 ||:  43%|####3     | 48/111 [00:34<00:48,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9235, LAS: 0.8643, UEM: 0.4635, LEM: 0.2325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5594, partial_loss/deprel_loss: 1.1760, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3673, loss: 0.9154, batch_reg_loss: 0.1147, reg_loss: 0.1141 ||:  47%|####6     | 52/111 [00:36<00:42,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8303, UAS: 0.9236, LAS: 0.8641, UEM: 0.4612, LEM: 0.2281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1919, partial_loss/deprel_loss: 1.0681, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2076, loss: 0.9156, batch_reg_loss: 0.1147, reg_loss: 0.1142 ||:  50%|####9     | 55/111 [00:38<00:40,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9229, LAS: 0.8635, UEM: 0.4512, LEM: 0.2224, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7935, partial_loss/deprel_loss: 0.7807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8981, loss: 0.9207, batch_reg_loss: 0.1148, reg_loss: 0.1142 ||:  53%|#####3    | 59/111 [00:41<00:36,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8556, UAS: 0.9232, LAS: 0.8639, UEM: 0.4533, LEM: 0.2245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7478, partial_loss/deprel_loss: 0.9507, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0250, loss: 0.9175, batch_reg_loss: 0.1149, reg_loss: 0.1142 ||:  57%|#####6    | 63/111 [00:44<00:32,  1.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9243, LAS: 0.8649, UEM: 0.4697, LEM: 0.2379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2051, partial_loss/deprel_loss: 0.3932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4706, loss: 0.9061, batch_reg_loss: 0.1150, reg_loss: 0.1143 ||:  60%|######    | 67/111 [00:46<00:30,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9244, LAS: 0.8650, UEM: 0.4710, LEM: 0.2382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3257, partial_loss/deprel_loss: 0.4715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5574, loss: 0.9044, batch_reg_loss: 0.1151, reg_loss: 0.1143 ||:  64%|######3   | 71/111 [00:49<00:26,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9256, LAS: 0.8662, UEM: 0.4812, LEM: 0.2444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3156, partial_loss/deprel_loss: 0.4371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5280, loss: 0.8951, batch_reg_loss: 0.1151, reg_loss: 0.1144 ||:  68%|######7   | 75/111 [00:52<00:24,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8323, UAS: 0.9258, LAS: 0.8662, UEM: 0.4778, LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0733, partial_loss/deprel_loss: 1.0164, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1430, loss: 0.8939, batch_reg_loss: 0.1152, reg_loss: 0.1144 ||:  71%|#######1  | 79/111 [00:54<00:20,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9250, LAS: 0.8653, UEM: 0.4695, LEM: 0.2337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6336, partial_loss/deprel_loss: 0.7658, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8547, loss: 0.9007, batch_reg_loss: 0.1153, reg_loss: 0.1144 ||:  75%|#######4  | 83/111 [00:57<00:18,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.9255, LAS: 0.8657, UEM: 0.4783, LEM: 0.2420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0986, partial_loss/deprel_loss: 1.0203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1513, loss: 0.8969, batch_reg_loss: 0.1154, reg_loss: 0.1145 ||:  78%|#######8  | 87/111 [00:59<00:15,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9263, LAS: 0.8668, UEM: 0.4890, LEM: 0.2493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6777, partial_loss/deprel_loss: 0.7179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8253, loss: 0.8871, batch_reg_loss: 0.1154, reg_loss: 0.1145 ||:  82%|########1 | 91/111 [01:02<00:13,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7511, UAS: 0.9233, LAS: 0.8634, UEM: 0.4815, LEM: 0.2455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6230, partial_loss/deprel_loss: 1.7261, partial_loss/cycle_loss: 0.0000, batch_loss: 2.0210, loss: 0.9162, batch_reg_loss: 0.1155, reg_loss: 0.1146 ||:  86%|########5 | 95/111 [01:05<00:10,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8200, UAS: 0.9234, LAS: 0.8636, UEM: 0.4813, LEM: 0.2444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2783, partial_loss/deprel_loss: 1.1654, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3036, loss: 0.9147, batch_reg_loss: 0.1156, reg_loss: 0.1146 ||:  89%|########9 | 99/111 [01:07<00:07,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7740, UAS: 0.9232, LAS: 0.8632, UEM: 0.4859, LEM: 0.2475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9147, partial_loss/deprel_loss: 1.3908, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6113, loss: 0.9170, batch_reg_loss: 0.1157, reg_loss: 0.1146 ||:  93%|#########2| 103/111 [01:10<00:05,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9528, UAS: 0.9242, LAS: 0.8645, UEM: 0.5148, LEM: 0.2843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0692, partial_loss/deprel_loss: 0.2025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2916, loss: 0.9075, batch_reg_loss: 0.1158, reg_loss: 0.1147 ||:  95%|#########5| 106/111 [01:14<00:04,  1.16it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9248, LAS: 0.8652, UEM: 0.5157, LEM: 0.2832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3227, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5760, loss: 0.9015, batch_reg_loss: 0.1159, reg_loss: 0.1147 ||:  99%|#########9| 110/111 [01:17<00:00,  1.26it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7932, UAS: 0.9241, LAS: 0.8645, UEM: 0.5140, LEM: 0.2822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8952, partial_loss/deprel_loss: 1.3438, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5700, loss: 0.9075, batch_reg_loss: 0.1159, reg_loss: 0.1147 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
      "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:29:13,387 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.344  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.895  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.115  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - UEM                      |     0.514  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - LAS                      |     0.865  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - loss                     |     0.908  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - LEM                      |     0.282  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - UAS                      |     0.924  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - EM                       |     0.793  |       N/A\n",
      "2023-04-06 23:29:13,388 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:29:13,389 - INFO - combo.training.trainer - Epoch duration: 0:01:17.829257\n",
      "2023-04-06 23:29:13,389 - INFO - combo.training.trainer - Estimated training time remaining: 8:06:21\n",
      "2023-04-06 23:29:13,389 - INFO - allennlp.training.trainer - Epoch 30/399\n",
      "2023-04-06 23:29:13,389 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:29:13,390 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:29:13,396 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8497, UAS: 0.9423, LAS: 0.8831, UEM: 0.5266, LEM: 0.2405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8957, partial_loss/deprel_loss: 0.8831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0016, loss: 0.7764, batch_reg_loss: 0.1160, reg_loss: 0.1159 ||:   4%|3         | 4/111 [00:02<01:10,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9297, LAS: 0.8704, UEM: 0.4777, LEM: 0.2176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4410, partial_loss/deprel_loss: 1.0704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2605, loss: 0.8706, batch_reg_loss: 0.1160, reg_loss: 0.1160 ||:   6%|6         | 7/111 [00:04<01:10,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7884, UAS: 0.9209, LAS: 0.8615, UEM: 0.4229, LEM: 0.1835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9655, partial_loss/deprel_loss: 1.3005, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5497, loss: 0.9493, batch_reg_loss: 0.1161, reg_loss: 0.1160 ||:  10%|9         | 11/111 [00:07<01:05,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9205, LAS: 0.8604, UEM: 0.4367, LEM: 0.2013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3561, partial_loss/deprel_loss: 0.5195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6030, loss: 0.9509, batch_reg_loss: 0.1162, reg_loss: 0.1160 ||:  13%|#2        | 14/111 [00:09<01:05,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8844, UAS: 0.9244, LAS: 0.8644, UEM: 0.4492, LEM: 0.2016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4715, partial_loss/deprel_loss: 0.6246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7102, loss: 0.9135, batch_reg_loss: 0.1162, reg_loss: 0.1161 ||:  15%|#5        | 17/111 [00:11<01:07,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8499, UAS: 0.9269, LAS: 0.8684, UEM: 0.4862, LEM: 0.2381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1172, partial_loss/deprel_loss: 0.9006, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0602, loss: 0.8846, batch_reg_loss: 0.1163, reg_loss: 0.1161 ||:  18%|#8        | 20/111 [00:13<01:05,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9247, LAS: 0.8656, UEM: 0.4565, LEM: 0.2166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6565, partial_loss/deprel_loss: 0.8579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9340, loss: 0.9051, batch_reg_loss: 0.1164, reg_loss: 0.1161 ||:  22%|##1       | 24/111 [00:16<00:59,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7923, UAS: 0.9189, LAS: 0.8592, UEM: 0.4360, LEM: 0.2045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9101, partial_loss/deprel_loss: 1.2817, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5238, loss: 0.9555, batch_reg_loss: 0.1164, reg_loss: 0.1162 ||:  24%|##4       | 27/111 [00:18<00:57,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8100, UAS: 0.9204, LAS: 0.8606, UEM: 0.4805, LEM: 0.2478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4343, partial_loss/deprel_loss: 1.1992, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3628, loss: 0.9425, batch_reg_loss: 0.1165, reg_loss: 0.1162 ||:  27%|##7       | 30/111 [00:20<00:58,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9195, LAS: 0.8595, UEM: 0.4778, LEM: 0.2454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3692, partial_loss/deprel_loss: 0.5469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6280, loss: 0.9496, batch_reg_loss: 0.1166, reg_loss: 0.1162 ||:  31%|###       | 34/111 [00:23<00:54,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8410, UAS: 0.9186, LAS: 0.8582, UEM: 0.4590, LEM: 0.2313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0912, partial_loss/deprel_loss: 0.9415, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0881, loss: 0.9539, batch_reg_loss: 0.1167, reg_loss: 0.1163 ||:  34%|###4      | 38/111 [00:26<00:49,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9205, LAS: 0.8606, UEM: 0.4768, LEM: 0.2436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2957, partial_loss/deprel_loss: 0.4494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5354, loss: 0.9355, batch_reg_loss: 0.1168, reg_loss: 0.1163 ||:  38%|###7      | 42/111 [00:28<00:47,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7559, UAS: 0.9180, LAS: 0.8576, UEM: 0.4588, LEM: 0.2320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.5943, partial_loss/deprel_loss: 1.6157, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9283, loss: 0.9636, batch_reg_loss: 0.1169, reg_loss: 0.1164 ||:  41%|####1     | 46/111 [00:31<00:44,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8097, UAS: 0.9180, LAS: 0.8578, UEM: 0.4674, LEM: 0.2415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4850, partial_loss/deprel_loss: 1.1822, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3597, loss: 0.9619, batch_reg_loss: 0.1169, reg_loss: 0.1164 ||:  44%|####4     | 49/111 [00:33<00:44,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8284, UAS: 0.9181, LAS: 0.8578, UEM: 0.4559, LEM: 0.2312, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1495, partial_loss/deprel_loss: 1.0793, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2104, loss: 0.9637, batch_reg_loss: 0.1170, reg_loss: 0.1165 ||:  48%|####7     | 53/111 [00:36<00:40,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9192, LAS: 0.8589, UEM: 0.4595, LEM: 0.2339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8674, partial_loss/deprel_loss: 1.0027, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0928, loss: 0.9569, batch_reg_loss: 0.1171, reg_loss: 0.1165 ||:  51%|#####1    | 57/111 [00:39<00:36,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9202, LAS: 0.8601, UEM: 0.4839, LEM: 0.2551, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1942, partial_loss/deprel_loss: 0.3969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4736, loss: 0.9449, batch_reg_loss: 0.1172, reg_loss: 0.1165 ||:  55%|#####4    | 61/111 [00:41<00:33,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9211, LAS: 0.8613, UEM: 0.4880, LEM: 0.2559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6812, partial_loss/deprel_loss: 0.7970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8911, loss: 0.9362, batch_reg_loss: 0.1173, reg_loss: 0.1166 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9211, LAS: 0.8612, UEM: 0.4893, LEM: 0.2595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9298, partial_loss/deprel_loss: 0.8934, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0180, loss: 0.9348, batch_reg_loss: 0.1173, reg_loss: 0.1166 ||:  60%|######    | 67/111 [00:46<00:31,  1.42it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9214, LAS: 0.8614, UEM: 0.4829, LEM: 0.2532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5818, partial_loss/deprel_loss: 0.6596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7614, loss: 0.9320, batch_reg_loss: 0.1174, reg_loss: 0.1166 ||:  63%|######3   | 70/111 [00:48<00:28,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8274, UAS: 0.9210, LAS: 0.8611, UEM: 0.4750, LEM: 0.2475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3160, partial_loss/deprel_loss: 1.0731, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2391, loss: 0.9346, batch_reg_loss: 0.1175, reg_loss: 0.1167 ||:  67%|######6   | 74/111 [00:50<00:25,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9217, LAS: 0.8620, UEM: 0.4883, LEM: 0.2643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1238, partial_loss/deprel_loss: 0.2637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3533, loss: 0.9277, batch_reg_loss: 0.1175, reg_loss: 0.1167 ||:  69%|######9   | 77/111 [00:52<00:22,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9227, LAS: 0.8631, UEM: 0.4886, LEM: 0.2645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4876, partial_loss/deprel_loss: 0.5759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.9184, batch_reg_loss: 0.1176, reg_loss: 0.1168 ||:  73%|#######2  | 81/111 [00:55<00:19,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9236, LAS: 0.8643, UEM: 0.4999, LEM: 0.2729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2840, partial_loss/deprel_loss: 0.4352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5226, loss: 0.9100, batch_reg_loss: 0.1177, reg_loss: 0.1168 ||:  77%|#######6  | 85/111 [00:58<00:18,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9248, LAS: 0.8659, UEM: 0.5212, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0727, partial_loss/deprel_loss: 0.1867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2816, loss: 0.8990, batch_reg_loss: 0.1177, reg_loss: 0.1168 ||:  79%|#######9  | 88/111 [01:00<00:16,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9253, LAS: 0.8663, UEM: 0.5287, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3533, partial_loss/deprel_loss: 0.6083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6751, loss: 0.8959, batch_reg_loss: 0.1178, reg_loss: 0.1169 ||:  82%|########1 | 91/111 [01:02<00:14,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9255, LAS: 0.8665, UEM: 0.5249, LEM: 0.2978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5523, partial_loss/deprel_loss: 0.6384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7391, loss: 0.8944, batch_reg_loss: 0.1179, reg_loss: 0.1169 ||:  86%|########5 | 95/111 [01:05<00:10,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8749, UAS: 0.9255, LAS: 0.8662, UEM: 0.5190, LEM: 0.2914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5470, partial_loss/deprel_loss: 0.7722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8451, loss: 0.8972, batch_reg_loss: 0.1179, reg_loss: 0.1169 ||:  89%|########9 | 99/111 [01:07<00:07,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9260, LAS: 0.8667, UEM: 0.5188, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5216, partial_loss/deprel_loss: 0.6458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7390, loss: 0.8915, batch_reg_loss: 0.1180, reg_loss: 0.1170 ||:  93%|#########2| 103/111 [01:10<00:05,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9252, LAS: 0.8656, UEM: 0.5142, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5122, partial_loss/deprel_loss: 0.7142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7919, loss: 0.9013, batch_reg_loss: 0.1181, reg_loss: 0.1170 ||:  95%|#########5| 106/111 [01:12<00:03,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8074, UAS: 0.9252, LAS: 0.8657, UEM: 0.5133, LEM: 0.2834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5927, partial_loss/deprel_loss: 1.2844, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4642, loss: 0.9032, batch_reg_loss: 0.1181, reg_loss: 0.1171 ||:  99%|#########9| 110/111 [01:15<00:00,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7988, UAS: 0.9247, LAS: 0.8651, UEM: 0.5116, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6141, partial_loss/deprel_loss: 1.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4702, loss: 0.9083, batch_reg_loss: 0.1182, reg_loss: 0.1171 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-06 23:30:29,126 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8614, UAS: 0.9506, LAS: 0.8947, UEM: 0.6800, LEM: 0.3545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0408, partial_loss/deprel_loss: 44.2188, partial_loss/cycle_loss: 0.0000, batch_loss: 35.5832, loss: 24.8075, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.09it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9518, LAS: 0.8976, UEM: 0.6637, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3898, partial_loss/deprel_loss: 17.7429, partial_loss/cycle_loss: 0.0000, batch_loss: 14.2723, loss: 22.5560, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.08it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9389, LAS: 0.8836, UEM: 0.6104, LEM: 0.3091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9587, partial_loss/deprel_loss: 37.7004, partial_loss/cycle_loss: 0.0000, batch_loss: 30.3521, loss: 26.7216, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.04it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8765, UAS: 0.9361, LAS: 0.8796, UEM: 0.5538, LEM: 0.2631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6483, partial_loss/deprel_loss: 35.0183, partial_loss/cycle_loss: 0.0000, batch_loss: 28.1443, loss: 27.8730, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.05it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9399, LAS: 0.8846, UEM: 0.6236, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1799, partial_loss/deprel_loss: 20.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 16.3867, loss: 26.3771, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.06it/s]\n",
      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:30:41,442 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.286  |    20.438\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.614  |     0.180\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.117  |     0.000\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - UEM                      |     0.512  |     0.624\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - LAS                      |     0.865  |     0.885\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - loss                     |     0.908  |    26.377\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - LEM                      |     0.282  |     0.353\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - UAS                      |     0.925  |     0.940\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - EM                       |     0.799  |     0.937\n",
      "2023-04-06 23:30:41,443 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:30:41,444 - INFO - combo.training.trainer - Epoch duration: 0:01:28.054718\n",
      "2023-04-06 23:30:41,444 - INFO - combo.training.trainer - Estimated training time remaining: 8:06:52\n",
      "2023-04-06 23:30:41,444 - INFO - allennlp.training.trainer - Epoch 31/399\n",
      "2023-04-06 23:30:41,444 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:30:41,445 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:30:41,452 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8748, UAS: 0.9334, LAS: 0.8786, UEM: 0.4443, LEM: 0.1990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7236, partial_loss/deprel_loss: 0.7101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8310, loss: 0.8045, batch_reg_loss: 0.1182, reg_loss: 0.1182 ||:   4%|3         | 4/111 [00:02<01:04,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8270, UAS: 0.9250, LAS: 0.8677, UEM: 0.5060, LEM: 0.2710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1941, partial_loss/deprel_loss: 1.0869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2266, loss: 0.8819, batch_reg_loss: 0.1183, reg_loss: 0.1182 ||:   6%|6         | 7/111 [00:04<01:04,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9246, LAS: 0.8647, UEM: 0.5259, LEM: 0.2646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3370, partial_loss/deprel_loss: 0.5980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6641, loss: 0.9099, batch_reg_loss: 0.1184, reg_loss: 0.1183 ||:   9%|9         | 10/111 [00:06<01:06,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9163, LAS: 0.8569, UEM: 0.4684, LEM: 0.2328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7216, partial_loss/deprel_loss: 1.2022, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4245, loss: 0.9877, batch_reg_loss: 0.1184, reg_loss: 0.1183 ||:  12%|#1        | 13/111 [00:08<01:05,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9163, LAS: 0.8573, UEM: 0.4320, LEM: 0.2074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4364, partial_loss/deprel_loss: 0.6180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7002, loss: 0.9823, batch_reg_loss: 0.1185, reg_loss: 0.1183 ||:  15%|#5        | 17/111 [00:11<01:00,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9213, LAS: 0.8638, UEM: 0.5339, LEM: 0.3317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0738, partial_loss/deprel_loss: 0.1916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2866, loss: 0.9381, batch_reg_loss: 0.1186, reg_loss: 0.1184 ||:  19%|#8        | 21/111 [00:13<00:59,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7860, UAS: 0.9181, LAS: 0.8604, UEM: 0.5074, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8301, partial_loss/deprel_loss: 1.2250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4647, loss: 0.9604, batch_reg_loss: 0.1187, reg_loss: 0.1184 ||:  22%|##1       | 24/111 [00:16<00:59,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9206, LAS: 0.8625, UEM: 0.5125, LEM: 0.3077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4054, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6872, loss: 0.9412, batch_reg_loss: 0.1188, reg_loss: 0.1185 ||:  25%|##5       | 28/111 [00:18<00:56,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9232, LAS: 0.8654, UEM: 0.5107, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5208, partial_loss/deprel_loss: 0.6426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7371, loss: 0.9181, batch_reg_loss: 0.1189, reg_loss: 0.1185 ||:  29%|##8       | 32/111 [00:21<00:52,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9209, LAS: 0.8630, UEM: 0.5014, LEM: 0.2881, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6350, partial_loss/deprel_loss: 0.7174, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8199, loss: 0.9377, batch_reg_loss: 0.1189, reg_loss: 0.1186 ||:  32%|###2      | 36/111 [00:23<00:49,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.9208, LAS: 0.8625, UEM: 0.4858, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7292, partial_loss/deprel_loss: 0.8410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9377, loss: 0.9367, batch_reg_loss: 0.1190, reg_loss: 0.1186 ||:  36%|###6      | 40/111 [00:26<00:45,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8642, UAS: 0.9211, LAS: 0.8619, UEM: 0.4705, LEM: 0.2575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7919, partial_loss/deprel_loss: 0.9952, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0737, loss: 0.9432, batch_reg_loss: 0.1191, reg_loss: 0.1186 ||:  40%|###9      | 44/111 [00:28<00:41,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8376, UAS: 0.9221, LAS: 0.8633, UEM: 0.4997, LEM: 0.2905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0615, partial_loss/deprel_loss: 1.0132, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1421, loss: 0.9287, batch_reg_loss: 0.1192, reg_loss: 0.1187 ||:  43%|####3     | 48/111 [00:31<00:41,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8288, UAS: 0.9231, LAS: 0.8644, UEM: 0.5092, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0852, partial_loss/deprel_loss: 1.0912, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2093, loss: 0.9185, batch_reg_loss: 0.1193, reg_loss: 0.1187 ||:  47%|####6     | 52/111 [00:34<00:41,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7887, UAS: 0.9225, LAS: 0.8640, UEM: 0.5098, LEM: 0.2945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1006, partial_loss/deprel_loss: 1.3113, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5885, loss: 0.9214, batch_reg_loss: 0.1194, reg_loss: 0.1188 ||:  50%|####9     | 55/111 [00:37<00:40,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9226, LAS: 0.8640, UEM: 0.5125, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3773, partial_loss/deprel_loss: 0.6483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7135, loss: 0.9201, batch_reg_loss: 0.1194, reg_loss: 0.1188 ||:  52%|#####2    | 58/111 [00:39<00:39,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8890, UAS: 0.9233, LAS: 0.8648, UEM: 0.5058, LEM: 0.2846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.6365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7419, loss: 0.9154, batch_reg_loss: 0.1195, reg_loss: 0.1188 ||:  56%|#####5    | 62/111 [00:41<00:33,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8473, UAS: 0.9228, LAS: 0.8639, UEM: 0.4991, LEM: 0.2779, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0141, partial_loss/deprel_loss: 0.9395, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0740, loss: 0.9225, batch_reg_loss: 0.1196, reg_loss: 0.1189 ||:  59%|#####9    | 66/111 [00:44<00:29,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9241, LAS: 0.8651, UEM: 0.5039, LEM: 0.2764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4332, partial_loss/deprel_loss: 0.6507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7269, loss: 0.9121, batch_reg_loss: 0.1197, reg_loss: 0.1189 ||:  63%|######3   | 70/111 [00:46<00:26,  1.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8310, UAS: 0.9232, LAS: 0.8641, UEM: 0.4970, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0867, partial_loss/deprel_loss: 0.9831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1236, loss: 0.9186, batch_reg_loss: 0.1197, reg_loss: 0.1190 ||:  67%|######6   | 74/111 [00:49<00:23,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9234, LAS: 0.8646, UEM: 0.4956, LEM: 0.2692, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3508, partial_loss/deprel_loss: 0.4847, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5778, loss: 0.9129, batch_reg_loss: 0.1198, reg_loss: 0.1190 ||:  70%|#######   | 78/111 [00:51<00:21,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8663, UAS: 0.9245, LAS: 0.8657, UEM: 0.4978, LEM: 0.2687, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6454, partial_loss/deprel_loss: 0.8686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9439, loss: 0.9062, batch_reg_loss: 0.1199, reg_loss: 0.1191 ||:  74%|#######3  | 82/111 [00:54<00:18,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8569, UAS: 0.9247, LAS: 0.8661, UEM: 0.5063, LEM: 0.2793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8980, partial_loss/deprel_loss: 0.8663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9927, loss: 0.9016, batch_reg_loss: 0.1200, reg_loss: 0.1191 ||:  77%|#######7  | 86/111 [00:57<00:16,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9252, LAS: 0.8666, UEM: 0.5083, LEM: 0.2791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2980, partial_loss/deprel_loss: 0.4854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5679, loss: 0.8977, batch_reg_loss: 0.1200, reg_loss: 0.1191 ||:  80%|########  | 89/111 [00:59<00:14,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8134, UAS: 0.9248, LAS: 0.8661, UEM: 0.5076, LEM: 0.2791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3499, partial_loss/deprel_loss: 1.1000, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2701, loss: 0.9023, batch_reg_loss: 0.1201, reg_loss: 0.1192 ||:  83%|########2 | 92/111 [01:01<00:13,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8550, UAS: 0.9230, LAS: 0.8643, UEM: 0.4989, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0115, partial_loss/deprel_loss: 0.9014, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0436, loss: 0.9173, batch_reg_loss: 0.1202, reg_loss: 0.1192 ||:  86%|########6 | 96/111 [01:04<00:10,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9233, LAS: 0.8645, UEM: 0.4989, LEM: 0.2735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2969, partial_loss/deprel_loss: 0.4878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5699, loss: 0.9146, batch_reg_loss: 0.1202, reg_loss: 0.1192 ||:  89%|########9 | 99/111 [01:06<00:08,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8444, UAS: 0.9238, LAS: 0.8649, UEM: 0.5049, LEM: 0.2769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8979, partial_loss/deprel_loss: 0.9199, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0358, loss: 0.9114, batch_reg_loss: 0.1203, reg_loss: 0.1193 ||:  92%|#########1| 102/111 [01:08<00:06,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8377, UAS: 0.9244, LAS: 0.8655, UEM: 0.5149, LEM: 0.2847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1225, partial_loss/deprel_loss: 1.0132, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1554, loss: 0.9060, batch_reg_loss: 0.1204, reg_loss: 0.1193 ||:  95%|#########4| 105/111 [01:10<00:04,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9240, LAS: 0.8650, UEM: 0.5085, LEM: 0.2798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4996, partial_loss/deprel_loss: 0.6632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7509, loss: 0.9104, batch_reg_loss: 0.1205, reg_loss: 0.1193 ||:  98%|#########8| 109/111 [01:13<00:01,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9245, LAS: 0.8656, UEM: 0.5131, LEM: 0.2829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4847, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7048, loss: 0.9049, batch_reg_loss: 0.1205, reg_loss: 0.1194 ||: 100%|##########| 111/111 [01:14<00:00,  1.48it/s]\n",
      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:31:56,226 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.609  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.485  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.119  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - UEM                      |     0.513  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - LAS                      |     0.866  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - loss                     |     0.905  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - LEM                      |     0.283  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - UAS                      |     0.925  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - EM                       |     0.891  |       N/A\n",
      "2023-04-06 23:31:56,227 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:31:56,228 - INFO - combo.training.trainer - Epoch duration: 0:01:14.783878\n",
      "2023-04-06 23:31:56,228 - INFO - combo.training.trainer - Estimated training time remaining: 8:04:42\n",
      "2023-04-06 23:31:56,228 - INFO - allennlp.training.trainer - Epoch 32/399\n",
      "2023-04-06 23:31:56,228 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:31:56,229 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:31:56,236 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.9280, LAS: 0.8652, UEM: 0.3878, LEM: 0.1763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0858, partial_loss/deprel_loss: 1.0690, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1930, loss: 0.9121, batch_reg_loss: 0.1206, reg_loss: 0.1205 ||:   4%|3         | 4/111 [00:02<01:12,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8781, UAS: 0.9222, LAS: 0.8593, UEM: 0.3942, LEM: 0.1663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5145, partial_loss/deprel_loss: 0.7455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8199, loss: 0.9508, batch_reg_loss: 0.1206, reg_loss: 0.1206 ||:   6%|6         | 7/111 [00:04<01:11,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9268, LAS: 0.8661, UEM: 0.4804, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3036, partial_loss/deprel_loss: 0.5117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5908, loss: 0.8993, batch_reg_loss: 0.1207, reg_loss: 0.1206 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9294, LAS: 0.8701, UEM: 0.4779, LEM: 0.2266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7947, partial_loss/deprel_loss: 0.9712, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0567, loss: 0.8729, batch_reg_loss: 0.1207, reg_loss: 0.1206 ||:  12%|#1        | 13/111 [00:08<01:07,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 0.9245, LAS: 0.8648, UEM: 0.4336, LEM: 0.2022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7990, partial_loss/deprel_loss: 0.7857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9092, loss: 0.9191, batch_reg_loss: 0.1208, reg_loss: 0.1207 ||:  14%|#4        | 16/111 [00:11<01:05,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9516, UAS: 0.9268, LAS: 0.8677, UEM: 0.5322, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0926, partial_loss/deprel_loss: 0.2178, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3136, loss: 0.8968, batch_reg_loss: 0.1209, reg_loss: 0.1207 ||:  17%|#7        | 19/111 [00:13<01:05,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8848, UAS: 0.9291, LAS: 0.8698, UEM: 0.5301, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5335, partial_loss/deprel_loss: 0.6623, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 0.8739, batch_reg_loss: 0.1209, reg_loss: 0.1207 ||:  20%|#9        | 22/111 [00:15<01:06,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8973, UAS: 0.9269, LAS: 0.8675, UEM: 0.5307, LEM: 0.3049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3634, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6176, loss: 0.8880, batch_reg_loss: 0.1210, reg_loss: 0.1207 ||:  23%|##2       | 25/111 [00:18<01:04,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9255, LAS: 0.8662, UEM: 0.5171, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1714, partial_loss/deprel_loss: 1.0061, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1602, loss: 0.9002, batch_reg_loss: 0.1210, reg_loss: 0.1208 ||:  25%|##5       | 28/111 [00:20<01:03,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9248, LAS: 0.8655, UEM: 0.5165, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2944, partial_loss/deprel_loss: 0.4554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5443, loss: 0.9082, batch_reg_loss: 0.1211, reg_loss: 0.1208 ||:  28%|##7       | 31/111 [00:22<01:01,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9272, LAS: 0.8687, UEM: 0.5406, LEM: 0.3166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1706, partial_loss/deprel_loss: 0.3330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4217, loss: 0.8810, batch_reg_loss: 0.1211, reg_loss: 0.1208 ||:  31%|###       | 34/111 [00:25<00:59,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9299, LAS: 0.8714, UEM: 0.5655, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1528, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4713, loss: 0.8544, batch_reg_loss: 0.1212, reg_loss: 0.1209 ||:  34%|###4      | 38/111 [00:27<00:54,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7832, UAS: 0.9285, LAS: 0.8704, UEM: 0.5675, LEM: 0.3304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1536, partial_loss/deprel_loss: 1.2558, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5566, loss: 0.8616, batch_reg_loss: 0.1213, reg_loss: 0.1209 ||:  37%|###6      | 41/111 [00:30<00:53,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9300, LAS: 0.8721, UEM: 0.5725, LEM: 0.3317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3764, partial_loss/deprel_loss: 0.4992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.8479, batch_reg_loss: 0.1213, reg_loss: 0.1209 ||:  40%|###9      | 44/111 [00:32<00:50,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9297, LAS: 0.8715, UEM: 0.5590, LEM: 0.3199, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3903, partial_loss/deprel_loss: 0.6036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6823, loss: 0.8563, batch_reg_loss: 0.1214, reg_loss: 0.1210 ||:  43%|####3     | 48/111 [00:35<00:46,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9309, LAS: 0.8732, UEM: 0.5558, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4737, partial_loss/deprel_loss: 0.6535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7390, loss: 0.8460, batch_reg_loss: 0.1215, reg_loss: 0.1210 ||:  47%|####6     | 52/111 [00:37<00:41,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8597, UAS: 0.9302, LAS: 0.8723, UEM: 0.5439, LEM: 0.3032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6993, partial_loss/deprel_loss: 0.7695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8770, loss: 0.8525, batch_reg_loss: 0.1215, reg_loss: 0.1210 ||:  50%|#####     | 56/111 [00:40<00:37,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8500, UAS: 0.9306, LAS: 0.8729, UEM: 0.5460, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0724, partial_loss/deprel_loss: 1.0548, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1799, loss: 0.8494, batch_reg_loss: 0.1216, reg_loss: 0.1211 ||:  53%|#####3    | 59/111 [00:42<00:37,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8331, UAS: 0.9290, LAS: 0.8712, UEM: 0.5358, LEM: 0.2987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2836, partial_loss/deprel_loss: 0.9883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1690, loss: 0.8636, batch_reg_loss: 0.1216, reg_loss: 0.1211 ||:  56%|#####5    | 62/111 [00:44<00:34,  1.41it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9293, LAS: 0.8715, UEM: 0.5296, LEM: 0.2908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6870, partial_loss/deprel_loss: 0.7730, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8775, loss: 0.8617, batch_reg_loss: 0.1217, reg_loss: 0.1211 ||:  59%|#####9    | 66/111 [00:47<00:30,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8233, UAS: 0.9263, LAS: 0.8683, UEM: 0.5209, LEM: 0.2855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4318, partial_loss/deprel_loss: 1.0938, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2831, loss: 0.8883, batch_reg_loss: 0.1218, reg_loss: 0.1211 ||:  62%|######2   | 69/111 [00:49<00:28,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9263, LAS: 0.8683, UEM: 0.5139, LEM: 0.2789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7876, partial_loss/deprel_loss: 0.7696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8951, loss: 0.8890, batch_reg_loss: 0.1218, reg_loss: 0.1212 ||:  66%|######5   | 73/111 [00:51<00:24,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8262, UAS: 0.9260, LAS: 0.8681, UEM: 0.5085, LEM: 0.2743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1389, partial_loss/deprel_loss: 1.0152, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1619, loss: 0.8884, batch_reg_loss: 0.1219, reg_loss: 0.1212 ||:  69%|######9   | 77/111 [00:54<00:22,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9255, LAS: 0.8675, UEM: 0.5156, LEM: 0.2866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.2815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3720, loss: 0.8924, batch_reg_loss: 0.1220, reg_loss: 0.1213 ||:  73%|#######2  | 81/111 [00:57<00:19,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9251, LAS: 0.8669, UEM: 0.5146, LEM: 0.2873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3275, partial_loss/deprel_loss: 0.4241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5269, loss: 0.8963, batch_reg_loss: 0.1221, reg_loss: 0.1213 ||:  77%|#######6  | 85/111 [00:59<00:17,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9257, LAS: 0.8675, UEM: 0.5170, LEM: 0.2874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8591, partial_loss/deprel_loss: 0.9767, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0754, loss: 0.8924, batch_reg_loss: 0.1222, reg_loss: 0.1213 ||:  79%|#######9  | 88/111 [01:02<00:16,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9258, LAS: 0.8675, UEM: 0.5237, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1875, partial_loss/deprel_loss: 0.3560, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4446, loss: 0.8923, batch_reg_loss: 0.1222, reg_loss: 0.1214 ||:  82%|########1 | 91/111 [01:04<00:14,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9017, UAS: 0.9254, LAS: 0.8670, UEM: 0.5240, LEM: 0.2931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3555, partial_loss/deprel_loss: 0.5276, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6155, loss: 0.8989, batch_reg_loss: 0.1223, reg_loss: 0.1214 ||:  86%|########5 | 95/111 [01:07<00:11,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.9248, LAS: 0.8662, UEM: 0.5177, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9644, partial_loss/deprel_loss: 0.8869, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0248, loss: 0.9030, batch_reg_loss: 0.1224, reg_loss: 0.1214 ||:  88%|########8 | 98/111 [01:09<00:09,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9248, LAS: 0.8662, UEM: 0.5197, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6818, partial_loss/deprel_loss: 0.8229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9171, loss: 0.9023, batch_reg_loss: 0.1225, reg_loss: 0.1215 ||:  92%|#########1| 102/111 [01:11<00:06,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8629, UAS: 0.9248, LAS: 0.8661, UEM: 0.5155, LEM: 0.2858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8211, partial_loss/deprel_loss: 0.8211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9436, loss: 0.9038, batch_reg_loss: 0.1226, reg_loss: 0.1215 ||:  95%|#########5| 106/111 [01:14<00:03,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8603, UAS: 0.9251, LAS: 0.8664, UEM: 0.5153, LEM: 0.2849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7650, partial_loss/deprel_loss: 0.8273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9375, loss: 0.9013, batch_reg_loss: 0.1226, reg_loss: 0.1215 ||:  99%|#########9| 110/111 [01:16<00:00,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8006, UAS: 0.9245, LAS: 0.8658, UEM: 0.5134, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5343, partial_loss/deprel_loss: 1.2796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4532, loss: 0.9062, batch_reg_loss: 0.1227, reg_loss: 0.1215 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:33:13,713 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.280  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.534  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.122  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - UEM                      |     0.513  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - LAS                      |     0.866  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - loss                     |     0.906  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - LEM                      |     0.284  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - UAS                      |     0.925  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - EM                       |     0.801  |       N/A\n",
      "2023-04-06 23:33:13,714 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:33:13,715 - INFO - combo.training.trainer - Epoch duration: 0:01:17.486642\n",
      "2023-04-06 23:33:13,715 - INFO - combo.training.trainer - Estimated training time remaining: 8:03:06\n",
      "2023-04-06 23:33:13,715 - INFO - allennlp.training.trainer - Epoch 33/399\n",
      "2023-04-06 23:33:13,715 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:33:13,716 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:33:13,722 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8321, UAS: 0.9211, LAS: 0.8634, UEM: 0.2448, LEM: 0.0606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2054, partial_loss/deprel_loss: 0.9809, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1485, loss: 0.9179, batch_reg_loss: 0.1227, reg_loss: 0.1227 ||:   4%|3         | 4/111 [00:02<01:16,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9216, LAS: 0.8649, UEM: 0.4007, LEM: 0.2139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8307, partial_loss/deprel_loss: 0.7976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9270, loss: 0.9128, batch_reg_loss: 0.1228, reg_loss: 0.1227 ||:   6%|6         | 7/111 [00:05<01:17,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9301, LAS: 0.8748, UEM: 0.4858, LEM: 0.2617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5363, partial_loss/deprel_loss: 0.5515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6713, loss: 0.8323, batch_reg_loss: 0.1229, reg_loss: 0.1228 ||:   9%|9         | 10/111 [00:07<01:16,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9291, LAS: 0.8730, UEM: 0.4607, LEM: 0.2289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6542, partial_loss/deprel_loss: 0.7278, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8360, loss: 0.8399, batch_reg_loss: 0.1229, reg_loss: 0.1228 ||:  13%|#2        | 14/111 [00:10<01:09,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9238, LAS: 0.8661, UEM: 0.4238, LEM: 0.2058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1477, partial_loss/deprel_loss: 1.0175, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1666, loss: 0.9019, batch_reg_loss: 0.1230, reg_loss: 0.1228 ||:  15%|#5        | 17/111 [00:12<01:06,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9265, LAS: 0.8681, UEM: 0.4492, LEM: 0.2182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2747, partial_loss/deprel_loss: 0.4835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5648, loss: 0.8846, batch_reg_loss: 0.1231, reg_loss: 0.1229 ||:  18%|#8        | 20/111 [00:14<01:03,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7840, UAS: 0.9254, LAS: 0.8666, UEM: 0.4648, LEM: 0.2258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8170, partial_loss/deprel_loss: 1.3568, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5720, loss: 0.8961, batch_reg_loss: 0.1231, reg_loss: 0.1229 ||:  21%|##        | 23/111 [00:16<01:02,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.9235, LAS: 0.8644, UEM: 0.4432, LEM: 0.2090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1372, partial_loss/deprel_loss: 0.9852, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1388, loss: 0.9177, batch_reg_loss: 0.1232, reg_loss: 0.1229 ||:  24%|##4       | 27/111 [00:18<00:57,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9265, LAS: 0.8682, UEM: 0.4929, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.4143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.8827, batch_reg_loss: 0.1232, reg_loss: 0.1230 ||:  27%|##7       | 30/111 [00:21<00:56,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9256, LAS: 0.8672, UEM: 0.4734, LEM: 0.2367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9719, partial_loss/deprel_loss: 0.9334, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0644, loss: 0.8918, batch_reg_loss: 0.1233, reg_loss: 0.1230 ||:  30%|##9       | 33/111 [00:23<00:53,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8678, UAS: 0.9268, LAS: 0.8684, UEM: 0.4827, LEM: 0.2445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6742, partial_loss/deprel_loss: 0.7842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8856, loss: 0.8809, batch_reg_loss: 0.1234, reg_loss: 0.1230 ||:  32%|###2      | 36/111 [00:25<00:52,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9268, LAS: 0.8687, UEM: 0.4928, LEM: 0.2582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1770, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4536, loss: 0.8786, batch_reg_loss: 0.1235, reg_loss: 0.1231 ||:  36%|###6      | 40/111 [00:27<00:47,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7844, UAS: 0.9267, LAS: 0.8682, UEM: 0.4953, LEM: 0.2548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8813, partial_loss/deprel_loss: 1.3088, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5469, loss: 0.8836, batch_reg_loss: 0.1235, reg_loss: 0.1231 ||:  40%|###9      | 44/111 [00:30<00:44,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8473, UAS: 0.9241, LAS: 0.8655, UEM: 0.4929, LEM: 0.2566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8672, partial_loss/deprel_loss: 0.9594, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0645, loss: 0.9084, batch_reg_loss: 0.1236, reg_loss: 0.1231 ||:  43%|####3     | 48/111 [00:33<00:42,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9233, LAS: 0.8647, UEM: 0.4857, LEM: 0.2512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4534, partial_loss/deprel_loss: 0.5398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6462, loss: 0.9137, batch_reg_loss: 0.1237, reg_loss: 0.1232 ||:  47%|####6     | 52/111 [00:35<00:39,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9234, LAS: 0.8646, UEM: 0.4809, LEM: 0.2454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4625, partial_loss/deprel_loss: 0.5691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6716, loss: 0.9135, batch_reg_loss: 0.1238, reg_loss: 0.1232 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9234, LAS: 0.8646, UEM: 0.5000, LEM: 0.2691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1320, partial_loss/deprel_loss: 0.2790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3734, loss: 0.9154, batch_reg_loss: 0.1239, reg_loss: 0.1233 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9247, LAS: 0.8660, UEM: 0.5193, LEM: 0.2878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2943, partial_loss/deprel_loss: 0.4989, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5819, loss: 0.9023, batch_reg_loss: 0.1239, reg_loss: 0.1233 ||:  57%|#####6    | 63/111 [00:44<00:37,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9245, LAS: 0.8655, UEM: 0.5094, LEM: 0.2790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8338, partial_loss/deprel_loss: 0.9125, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0207, loss: 0.9076, batch_reg_loss: 0.1240, reg_loss: 0.1233 ||:  60%|######    | 67/111 [00:47<00:32,  1.35it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9238, LAS: 0.8647, UEM: 0.5004, LEM: 0.2726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0190, partial_loss/deprel_loss: 0.8973, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0457, loss: 0.9132, batch_reg_loss: 0.1241, reg_loss: 0.1234 ||:  63%|######3   | 70/111 [00:49<00:29,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8830, UAS: 0.9256, LAS: 0.8670, UEM: 0.5380, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5388, partial_loss/deprel_loss: 0.6799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7758, loss: 0.8967, batch_reg_loss: 0.1241, reg_loss: 0.1234 ||:  66%|######5   | 73/111 [00:51<00:28,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9259, LAS: 0.8673, UEM: 0.5356, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4678, partial_loss/deprel_loss: 0.5111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6266, loss: 0.8944, batch_reg_loss: 0.1242, reg_loss: 0.1234 ||:  68%|######8   | 76/111 [00:53<00:26,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9264, LAS: 0.8678, UEM: 0.5363, LEM: 0.3104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5585, partial_loss/deprel_loss: 0.7297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8197, loss: 0.8902, batch_reg_loss: 0.1242, reg_loss: 0.1235 ||:  71%|#######1  | 79/111 [00:56<00:24,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7776, UAS: 0.9260, LAS: 0.8674, UEM: 0.5386, LEM: 0.3097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2130, partial_loss/deprel_loss: 1.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6674, loss: 0.8933, batch_reg_loss: 0.1243, reg_loss: 0.1235 ||:  74%|#######3  | 82/111 [00:58<00:22,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8544, UAS: 0.9256, LAS: 0.8668, UEM: 0.5348, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7456, partial_loss/deprel_loss: 0.7852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9016, loss: 0.8981, batch_reg_loss: 0.1244, reg_loss: 0.1235 ||:  77%|#######6  | 85/111 [01:00<00:19,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9255, LAS: 0.8665, UEM: 0.5300, LEM: 0.3019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5330, partial_loss/deprel_loss: 0.6727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7692, loss: 0.8982, batch_reg_loss: 0.1244, reg_loss: 0.1236 ||:  80%|########  | 89/111 [01:03<00:15,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9262, LAS: 0.8673, UEM: 0.5294, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4852, partial_loss/deprel_loss: 0.6245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7211, loss: 0.8921, batch_reg_loss: 0.1245, reg_loss: 0.1236 ||:  83%|########2 | 92/111 [01:05<00:13,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9261, LAS: 0.8670, UEM: 0.5272, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3968, partial_loss/deprel_loss: 0.5528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6462, loss: 0.8936, batch_reg_loss: 0.1246, reg_loss: 0.1236 ||:  86%|########6 | 96/111 [01:08<00:10,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8171, UAS: 0.9254, LAS: 0.8662, UEM: 0.5244, LEM: 0.2939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5442, partial_loss/deprel_loss: 0.9765, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2147, loss: 0.8996, batch_reg_loss: 0.1246, reg_loss: 0.1237 ||:  89%|########9 | 99/111 [01:10<00:08,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8560, UAS: 0.9260, LAS: 0.8668, UEM: 0.5231, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7287, partial_loss/deprel_loss: 0.8699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9663, loss: 0.8954, batch_reg_loss: 0.1247, reg_loss: 0.1237 ||:  93%|#########2| 103/111 [01:12<00:05,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9264, LAS: 0.8673, UEM: 0.5263, LEM: 0.2927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4031, partial_loss/deprel_loss: 0.6182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6999, loss: 0.8923, batch_reg_loss: 0.1248, reg_loss: 0.1237 ||:  95%|#########5| 106/111 [01:14<00:03,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8152, UAS: 0.9260, LAS: 0.8666, UEM: 0.5221, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2286, partial_loss/deprel_loss: 1.1836, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3174, loss: 0.8969, batch_reg_loss: 0.1249, reg_loss: 0.1238 ||:  99%|#########9| 110/111 [01:17<00:00,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9261, LAS: 0.8668, UEM: 0.5215, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5971, partial_loss/deprel_loss: 0.7101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8123, loss: 0.8961, batch_reg_loss: 0.1249, reg_loss: 0.1238 ||: 100%|##########| 111/111 [01:17<00:00,  1.42it/s]\n",
      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:34:31,637 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.710  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.597  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.124  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - UEM                      |     0.522  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - LAS                      |     0.867  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - loss                     |     0.896  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - LEM                      |     0.289  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - UAS                      |     0.926  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - EM                       |     0.884  |       N/A\n",
      "2023-04-06 23:34:31,638 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:34:31,639 - INFO - combo.training.trainer - Epoch duration: 0:01:17.923745\n",
      "2023-04-06 23:34:31,639 - INFO - combo.training.trainer - Estimated training time remaining: 8:01:36\n",
      "2023-04-06 23:34:31,639 - INFO - allennlp.training.trainer - Epoch 34/399\n",
      "2023-04-06 23:34:31,639 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:34:31,640 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:34:31,646 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8560, UAS: 0.9111, LAS: 0.8494, UEM: 0.1556, LEM: 0.0333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7581, partial_loss/deprel_loss: 0.8816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9818, loss: 1.0546, batch_reg_loss: 0.1249, reg_loss: 0.1249 ||:   3%|2         | 3/111 [00:02<01:13,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9056, LAS: 0.8439, UEM: 0.2538, LEM: 0.0790, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4955, partial_loss/deprel_loss: 0.6868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7736, loss: 1.0748, batch_reg_loss: 0.1250, reg_loss: 0.1249 ||:   5%|5         | 6/111 [00:04<01:12,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7825, UAS: 0.9077, LAS: 0.8464, UEM: 0.3817, LEM: 0.1861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7655, partial_loss/deprel_loss: 1.2883, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5088, loss: 1.0438, batch_reg_loss: 0.1251, reg_loss: 0.1250 ||:   8%|8         | 9/111 [00:06<01:09,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9136, LAS: 0.8528, UEM: 0.3986, LEM: 0.1842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6326, partial_loss/deprel_loss: 0.7305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8360, loss: 1.0011, batch_reg_loss: 0.1251, reg_loss: 0.1250 ||:  11%|#         | 12/111 [00:08<01:09,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8578, UAS: 0.9196, LAS: 0.8600, UEM: 0.4359, LEM: 0.1994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0891, partial_loss/deprel_loss: 0.8639, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0341, loss: 0.9523, batch_reg_loss: 0.1252, reg_loss: 0.1250 ||:  14%|#4        | 16/111 [00:10<01:04,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9183, LAS: 0.8599, UEM: 0.4232, LEM: 0.1982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4165, partial_loss/deprel_loss: 1.0787, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2716, loss: 0.9521, batch_reg_loss: 0.1253, reg_loss: 0.1251 ||:  18%|#8        | 20/111 [00:13<01:00,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9221, LAS: 0.8642, UEM: 0.4556, LEM: 0.2267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4718, partial_loss/deprel_loss: 0.5684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6744, loss: 0.9203, batch_reg_loss: 0.1253, reg_loss: 0.1251 ||:  21%|##        | 23/111 [00:15<01:01,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8940, UAS: 0.9262, LAS: 0.8687, UEM: 0.4854, LEM: 0.2382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4130, partial_loss/deprel_loss: 0.5913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6810, loss: 0.8882, batch_reg_loss: 0.1254, reg_loss: 0.1251 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9281, LAS: 0.8704, UEM: 0.4951, LEM: 0.2408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3141, partial_loss/deprel_loss: 0.4727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5664, loss: 0.8715, batch_reg_loss: 0.1255, reg_loss: 0.1252 ||:  26%|##6       | 29/111 [00:20<00:59,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8954, UAS: 0.9292, LAS: 0.8718, UEM: 0.5290, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3000, partial_loss/deprel_loss: 0.4808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5701, loss: 0.8581, batch_reg_loss: 0.1255, reg_loss: 0.1252 ||:  29%|##8       | 32/111 [00:22<00:59,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9294, LAS: 0.8719, UEM: 0.5231, LEM: 0.2740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3971, partial_loss/deprel_loss: 0.5997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6847, loss: 0.8609, batch_reg_loss: 0.1256, reg_loss: 0.1252 ||:  32%|###2      | 36/111 [00:25<00:53,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8502, UAS: 0.9275, LAS: 0.8696, UEM: 0.5066, LEM: 0.2621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9660, partial_loss/deprel_loss: 0.8184, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9736, loss: 0.8780, batch_reg_loss: 0.1256, reg_loss: 0.1253 ||:  36%|###6      | 40/111 [00:27<00:48,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9269, LAS: 0.8686, UEM: 0.4966, LEM: 0.2515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4479, partial_loss/deprel_loss: 0.6066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7006, loss: 0.8859, batch_reg_loss: 0.1257, reg_loss: 0.1253 ||:  40%|###9      | 44/111 [00:30<00:45,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9260, LAS: 0.8677, UEM: 0.4901, LEM: 0.2465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5388, partial_loss/deprel_loss: 0.5948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7094, loss: 0.8959, batch_reg_loss: 0.1258, reg_loss: 0.1253 ||:  42%|####2     | 47/111 [00:32<00:44,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9266, LAS: 0.8686, UEM: 0.4965, LEM: 0.2503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2710, partial_loss/deprel_loss: 0.4662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5530, loss: 0.8885, batch_reg_loss: 0.1259, reg_loss: 0.1254 ||:  46%|####5     | 51/111 [00:35<00:40,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9264, LAS: 0.8687, UEM: 0.5060, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0437, partial_loss/deprel_loss: 0.9126, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0648, loss: 0.8867, batch_reg_loss: 0.1259, reg_loss: 0.1254 ||:  49%|####8     | 54/111 [00:37<00:39,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9265, LAS: 0.8685, UEM: 0.4986, LEM: 0.2585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4914, partial_loss/deprel_loss: 0.6521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7459, loss: 0.8885, batch_reg_loss: 0.1260, reg_loss: 0.1254 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9267, LAS: 0.8690, UEM: 0.5166, LEM: 0.2750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3150, partial_loss/deprel_loss: 0.4455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.8846, batch_reg_loss: 0.1261, reg_loss: 0.1255 ||:  54%|#####4    | 60/111 [00:41<00:36,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9268, LAS: 0.8693, UEM: 0.5151, LEM: 0.2750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4608, partial_loss/deprel_loss: 0.5828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6845, loss: 0.8828, batch_reg_loss: 0.1261, reg_loss: 0.1255 ||:  57%|#####6    | 63/111 [00:44<00:35,  1.35it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8797, UAS: 0.9262, LAS: 0.8687, UEM: 0.5069, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5799, partial_loss/deprel_loss: 0.7299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8261, loss: 0.8887, batch_reg_loss: 0.1262, reg_loss: 0.1255 ||:  59%|#####9    | 66/111 [00:46<00:32,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8858, UAS: 0.9267, LAS: 0.8691, UEM: 0.5082, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5195, partial_loss/deprel_loss: 0.6044, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7137, loss: 0.8859, batch_reg_loss: 0.1262, reg_loss: 0.1256 ||:  62%|######2   | 69/111 [00:48<00:31,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7946, UAS: 0.9255, LAS: 0.8676, UEM: 0.4995, LEM: 0.2632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6270, partial_loss/deprel_loss: 1.1887, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4026, loss: 0.8979, batch_reg_loss: 0.1263, reg_loss: 0.1256 ||:  65%|######4   | 72/111 [00:50<00:29,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8650, UAS: 0.9261, LAS: 0.8686, UEM: 0.5204, LEM: 0.2931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7267, partial_loss/deprel_loss: 0.8069, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9172, loss: 0.8909, batch_reg_loss: 0.1264, reg_loss: 0.1256 ||:  68%|######7   | 75/111 [00:53<00:27,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8154, UAS: 0.9257, LAS: 0.8678, UEM: 0.5206, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2415, partial_loss/deprel_loss: 1.1330, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2811, loss: 0.8966, batch_reg_loss: 0.1264, reg_loss: 0.1257 ||:  71%|#######1  | 79/111 [00:55<00:23,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9256, LAS: 0.8678, UEM: 0.5151, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6984, partial_loss/deprel_loss: 0.7058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8308, loss: 0.8966, batch_reg_loss: 0.1265, reg_loss: 0.1257 ||:  74%|#######3  | 82/111 [00:58<00:21,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8430, UAS: 0.9253, LAS: 0.8674, UEM: 0.5110, LEM: 0.2866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1613, partial_loss/deprel_loss: 0.9831, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1453, loss: 0.9004, batch_reg_loss: 0.1266, reg_loss: 0.1257 ||:  77%|#######6  | 85/111 [01:00<00:18,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9256, LAS: 0.8676, UEM: 0.5044, LEM: 0.2798, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7210, partial_loss/deprel_loss: 0.8211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9277, loss: 0.8993, batch_reg_loss: 0.1266, reg_loss: 0.1258 ||:  80%|########  | 89/111 [01:02<00:14,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9267, LAS: 0.8690, UEM: 0.5185, LEM: 0.2945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1218, partial_loss/deprel_loss: 0.2729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3694, loss: 0.8883, batch_reg_loss: 0.1267, reg_loss: 0.1258 ||:  84%|########3 | 93/111 [01:05<00:12,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9271, LAS: 0.8695, UEM: 0.5184, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8011, partial_loss/deprel_loss: 0.7246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8667, loss: 0.8846, batch_reg_loss: 0.1268, reg_loss: 0.1258 ||:  87%|########7 | 97/111 [01:07<00:09,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8105, UAS: 0.9253, LAS: 0.8672, UEM: 0.5146, LEM: 0.2885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3796, partial_loss/deprel_loss: 1.2244, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3823, loss: 0.9042, batch_reg_loss: 0.1269, reg_loss: 0.1259 ||:  91%|######### | 101/111 [01:10<00:06,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9253, LAS: 0.8672, UEM: 0.5136, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4786, partial_loss/deprel_loss: 0.7123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7925, loss: 0.9034, batch_reg_loss: 0.1270, reg_loss: 0.1259 ||:  95%|#########4| 105/111 [01:12<00:03,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9259, LAS: 0.8680, UEM: 0.5158, LEM: 0.2860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3995, partial_loss/deprel_loss: 0.4815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5921, loss: 0.8959, batch_reg_loss: 0.1270, reg_loss: 0.1260 ||:  98%|#########8| 109/111 [01:15<00:01,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9261, LAS: 0.8681, UEM: 0.5174, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8394, partial_loss/deprel_loss: 0.8557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9796, loss: 0.8944, batch_reg_loss: 0.1271, reg_loss: 0.1260 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-06 23:35:48,409 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:35:48,409 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.856  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.839  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.126  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - UEM                      |     0.517  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - LAS                      |     0.868  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - loss                     |     0.894  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - LEM                      |     0.286  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - UAS                      |     0.926  |       N/A\n",
      "2023-04-06 23:35:48,410 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:35:48,411 - INFO - combo.training.tensorboard_writer - EM                       |     0.853  |       N/A\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-06 23:35:48,411 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:35:48,411 - INFO - combo.training.trainer - Epoch duration: 0:01:16.772068\n",
      "2023-04-06 23:35:48,411 - INFO - combo.training.trainer - Estimated training time remaining: 7:59:54\n",
      "2023-04-06 23:35:48,411 - INFO - allennlp.training.trainer - Epoch 35/399\n",
      "2023-04-06 23:35:48,411 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:35:48,412 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:35:48,418 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8295, UAS: 0.9216, LAS: 0.8633, UEM: 0.5277, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1609, partial_loss/deprel_loss: 0.9063, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0844, loss: 0.8635, batch_reg_loss: 0.1272, reg_loss: 0.1271 ||:   4%|3         | 4/111 [00:02<01:10,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9235, LAS: 0.8655, UEM: 0.4402, LEM: 0.2191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5437, partial_loss/deprel_loss: 0.6562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7609, loss: 0.8720, batch_reg_loss: 0.1272, reg_loss: 0.1272 ||:   6%|6         | 7/111 [00:04<01:09,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9283, LAS: 0.8721, UEM: 0.5337, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2537, partial_loss/deprel_loss: 0.4130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5084, loss: 0.8287, batch_reg_loss: 0.1273, reg_loss: 0.1272 ||:  10%|9         | 11/111 [00:07<01:04,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9337, LAS: 0.8795, UEM: 0.6324, LEM: 0.4287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8339, partial_loss/deprel_loss: 0.8628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9844, loss: 0.7854, batch_reg_loss: 0.1274, reg_loss: 0.1272 ||:  13%|#2        | 14/111 [00:09<01:05,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9359, LAS: 0.8817, UEM: 0.6234, LEM: 0.4027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4166, partial_loss/deprel_loss: 0.6455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7271, loss: 0.7716, batch_reg_loss: 0.1274, reg_loss: 0.1273 ||:  15%|#5        | 17/111 [00:11<01:03,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8421, UAS: 0.9321, LAS: 0.8770, UEM: 0.5887, LEM: 0.3752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9956, partial_loss/deprel_loss: 0.8582, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0131, loss: 0.8049, batch_reg_loss: 0.1275, reg_loss: 0.1273 ||:  18%|#8        | 20/111 [00:13<01:02,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9340, LAS: 0.8787, UEM: 0.5950, LEM: 0.3729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3717, partial_loss/deprel_loss: 0.6203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6981, loss: 0.7990, batch_reg_loss: 0.1275, reg_loss: 0.1273 ||:  21%|##        | 23/111 [00:15<01:01,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.9337, LAS: 0.8779, UEM: 0.5850, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2579, partial_loss/deprel_loss: 0.9992, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1785, loss: 0.8028, batch_reg_loss: 0.1276, reg_loss: 0.1273 ||:  24%|##4       | 27/111 [00:17<00:55,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9350, LAS: 0.8794, UEM: 0.5883, LEM: 0.3559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2687, partial_loss/deprel_loss: 0.4893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.7937, batch_reg_loss: 0.1276, reg_loss: 0.1274 ||:  27%|##7       | 30/111 [00:20<00:55,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9357, LAS: 0.8800, UEM: 0.5762, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6725, partial_loss/deprel_loss: 0.7140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8334, loss: 0.7902, batch_reg_loss: 0.1277, reg_loss: 0.1274 ||:  31%|###       | 34/111 [00:22<00:51,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8797, UAS: 0.9370, LAS: 0.8816, UEM: 0.5877, LEM: 0.3504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5669, partial_loss/deprel_loss: 0.7290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8244, loss: 0.7811, batch_reg_loss: 0.1278, reg_loss: 0.1274 ||:  33%|###3      | 37/111 [00:24<00:50,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8203, UAS: 0.9350, LAS: 0.8792, UEM: 0.5682, LEM: 0.3341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2426, partial_loss/deprel_loss: 1.1232, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2749, loss: 0.8012, batch_reg_loss: 0.1278, reg_loss: 0.1275 ||:  37%|###6      | 41/111 [00:27<00:47,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7827, UAS: 0.9333, LAS: 0.8773, UEM: 0.5601, LEM: 0.3259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1731, partial_loss/deprel_loss: 1.4011, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6834, loss: 0.8193, batch_reg_loss: 0.1279, reg_loss: 0.1275 ||:  41%|####      | 45/111 [00:30<00:44,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8356, UAS: 0.9327, LAS: 0.8767, UEM: 0.5487, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2953, partial_loss/deprel_loss: 0.9857, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1755, loss: 0.8261, batch_reg_loss: 0.1280, reg_loss: 0.1275 ||:  44%|####4     | 49/111 [00:32<00:41,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9332, LAS: 0.8771, UEM: 0.5407, LEM: 0.3053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6257, partial_loss/deprel_loss: 0.8141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9044, loss: 0.8255, batch_reg_loss: 0.1280, reg_loss: 0.1276 ||:  48%|####7     | 53/111 [00:35<00:37,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9305, LAS: 0.8738, UEM: 0.5267, LEM: 0.2957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7496, partial_loss/deprel_loss: 0.8220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9356, loss: 0.8506, batch_reg_loss: 0.1281, reg_loss: 0.1276 ||:  51%|#####1    | 57/111 [00:37<00:34,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9294, LAS: 0.8723, UEM: 0.5206, LEM: 0.2915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.6737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7804, loss: 0.8612, batch_reg_loss: 0.1282, reg_loss: 0.1276 ||:  55%|#####4    | 61/111 [00:40<00:32,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9286, LAS: 0.8712, UEM: 0.5098, LEM: 0.2818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6110, partial_loss/deprel_loss: 0.7682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8651, loss: 0.8717, batch_reg_loss: 0.1283, reg_loss: 0.1277 ||:  59%|#####8    | 65/111 [00:43<00:30,  1.53it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9255, LAS: 0.8680, UEM: 0.4994, LEM: 0.2757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8341, partial_loss/deprel_loss: 0.8179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9495, loss: 0.8981, batch_reg_loss: 0.1284, reg_loss: 0.1277 ||:  62%|######2   | 69/111 [00:45<00:28,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8583, UAS: 0.9260, LAS: 0.8685, UEM: 0.5123, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7949, partial_loss/deprel_loss: 0.7780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9098, loss: 0.8941, batch_reg_loss: 0.1284, reg_loss: 0.1278 ||:  65%|######4   | 72/111 [00:47<00:26,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7804, UAS: 0.9254, LAS: 0.8680, UEM: 0.5102, LEM: 0.2885, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1089, partial_loss/deprel_loss: 1.2912, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5832, loss: 0.8992, batch_reg_loss: 0.1285, reg_loss: 0.1278 ||:  68%|######7   | 75/111 [00:50<00:24,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9269, LAS: 0.8696, UEM: 0.5202, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2120, partial_loss/deprel_loss: 0.3991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4903, loss: 0.8862, batch_reg_loss: 0.1286, reg_loss: 0.1278 ||:  71%|#######1  | 79/111 [00:52<00:22,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9274, LAS: 0.8700, UEM: 0.5204, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3154, partial_loss/deprel_loss: 0.4886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5826, loss: 0.8838, batch_reg_loss: 0.1287, reg_loss: 0.1279 ||:  74%|#######3  | 82/111 [00:55<00:20,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9041, UAS: 0.9281, LAS: 0.8709, UEM: 0.5253, LEM: 0.2929, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3072, partial_loss/deprel_loss: 0.4757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5707, loss: 0.8759, batch_reg_loss: 0.1287, reg_loss: 0.1279 ||:  77%|#######6  | 85/111 [00:57<00:18,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8220, UAS: 0.9270, LAS: 0.8697, UEM: 0.5177, LEM: 0.2879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3218, partial_loss/deprel_loss: 1.0454, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2295, loss: 0.8849, batch_reg_loss: 0.1288, reg_loss: 0.1279 ||:  79%|#######9  | 88/111 [00:59<00:17,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8171, UAS: 0.9260, LAS: 0.8684, UEM: 0.5104, LEM: 0.2823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4441, partial_loss/deprel_loss: 1.2558, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4223, loss: 0.8980, batch_reg_loss: 0.1288, reg_loss: 0.1279 ||:  83%|########2 | 92/111 [01:02<00:13,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9262, LAS: 0.8686, UEM: 0.5193, LEM: 0.2901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3134, partial_loss/deprel_loss: 0.4586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5585, loss: 0.8958, batch_reg_loss: 0.1289, reg_loss: 0.1280 ||:  86%|########5 | 95/111 [01:04<00:11,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9256, LAS: 0.8679, UEM: 0.5131, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8674, partial_loss/deprel_loss: 0.8091, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9497, loss: 0.9019, batch_reg_loss: 0.1290, reg_loss: 0.1280 ||:  88%|########8 | 98/111 [01:06<00:09,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9268, LAS: 0.8692, UEM: 0.5273, LEM: 0.2957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3296, partial_loss/deprel_loss: 0.4673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5688, loss: 0.8912, batch_reg_loss: 0.1290, reg_loss: 0.1280 ||:  91%|######### | 101/111 [01:08<00:07,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8077, UAS: 0.9265, LAS: 0.8689, UEM: 0.5272, LEM: 0.2951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5767, partial_loss/deprel_loss: 1.2628, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4546, loss: 0.8940, batch_reg_loss: 0.1291, reg_loss: 0.1281 ||:  94%|#########3| 104/111 [01:11<00:05,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9270, LAS: 0.8692, UEM: 0.5252, LEM: 0.2916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9199, partial_loss/deprel_loss: 0.9289, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0563, loss: 0.8924, batch_reg_loss: 0.1292, reg_loss: 0.1281 ||:  97%|#########7| 108/111 [01:13<00:02,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8770, UAS: 0.9271, LAS: 0.8694, UEM: 0.5212, LEM: 0.2884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5733, partial_loss/deprel_loss: 0.6382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7544, loss: 0.8907, batch_reg_loss: 0.1292, reg_loss: 0.1281 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-06 23:37:04,098 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8198, UAS: 0.9346, LAS: 0.8832, UEM: 0.6393, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6542, partial_loss/deprel_loss: 60.5480, partial_loss/cycle_loss: 0.0000, batch_loss: 48.7692, loss: 28.2319, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:03<00:10,  1.05s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9413, LAS: 0.8902, UEM: 0.6892, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7597, partial_loss/deprel_loss: 30.7479, partial_loss/cycle_loss: 0.0000, batch_loss: 24.7503, loss: 26.1370, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:07,  1.02s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9004, UAS: 0.9440, LAS: 0.8904, UEM: 0.6567, LEM: 0.3837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4145, partial_loss/deprel_loss: 24.9592, partial_loss/cycle_loss: 0.0000, batch_loss: 20.0503, loss: 25.0336, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9429, LAS: 0.8893, UEM: 0.6474, LEM: 0.3799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0086, partial_loss/deprel_loss: 44.8982, partial_loss/cycle_loss: 0.0000, batch_loss: 36.1203, loss: 26.7810, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9419, LAS: 0.8881, UEM: 0.6314, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8470, partial_loss/deprel_loss: 31.8272, partial_loss/cycle_loss: 0.0000, batch_loss: 25.6312, loss: 26.6926, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.05it/s]\n",
      "2023-04-06 23:37:16,466 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.638  |    31.827\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.573  |     0.847\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.128  |     0.000\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - UEM                      |     0.521  |     0.631\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - LAS                      |     0.869  |     0.888\n",
      "2023-04-06 23:37:16,467 - INFO - combo.training.tensorboard_writer - loss                     |     0.891  |    26.693\n",
      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - LEM                      |     0.288  |     0.366\n",
      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - UAS                      |     0.927  |     0.942\n",
      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - EM                       |     0.877  |     0.874\n",
      "2023-04-06 23:37:16,468 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:37:16,469 - INFO - combo.training.trainer - Epoch duration: 0:01:28.057300\n",
      "2023-04-06 23:37:16,469 - INFO - combo.training.trainer - Estimated training time remaining: 8:00:08\n",
      "2023-04-06 23:37:16,469 - INFO - allennlp.training.trainer - Epoch 36/399\n",
      "2023-04-06 23:37:16,469 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:37:16,469 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-06 23:37:16,477 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9452, LAS: 0.8924, UEM: 0.5289, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4880, partial_loss/deprel_loss: 0.6698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7627, loss: 0.7053, batch_reg_loss: 0.1293, reg_loss: 0.1293 ||:   3%|2         | 3/111 [00:02<01:17,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7919, UAS: 0.9146, LAS: 0.8533, UEM: 0.4009, LEM: 0.1795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6848, partial_loss/deprel_loss: 1.3093, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5138, loss: 1.0154, batch_reg_loss: 0.1294, reg_loss: 0.1293 ||:   6%|6         | 7/111 [00:04<01:10,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9211, LAS: 0.8604, UEM: 0.4206, LEM: 0.1742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4597, partial_loss/deprel_loss: 0.6605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7498, loss: 0.9638, batch_reg_loss: 0.1294, reg_loss: 0.1293 ||:   9%|9         | 10/111 [00:06<01:09,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9129, LAS: 0.8526, UEM: 0.3770, LEM: 0.1513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8000, partial_loss/deprel_loss: 0.7861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9183, loss: 1.0215, batch_reg_loss: 0.1295, reg_loss: 0.1294 ||:  12%|#1        | 13/111 [00:08<01:07,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9189, LAS: 0.8602, UEM: 0.3997, LEM: 0.1637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4654, partial_loss/deprel_loss: 0.6501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7427, loss: 0.9621, batch_reg_loss: 0.1295, reg_loss: 0.1294 ||:  14%|#4        | 16/111 [00:11<01:08,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8315, UAS: 0.9139, LAS: 0.8544, UEM: 0.3725, LEM: 0.1497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0556, partial_loss/deprel_loss: 1.0156, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1532, loss: 1.0103, batch_reg_loss: 0.1296, reg_loss: 0.1294 ||:  17%|#7        | 19/111 [00:13<01:05,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9164, LAS: 0.8573, UEM: 0.4090, LEM: 0.1805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3374, partial_loss/deprel_loss: 0.4859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.9840, batch_reg_loss: 0.1296, reg_loss: 0.1294 ||:  20%|#9        | 22/111 [00:15<01:03,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9540, UAS: 0.9206, LAS: 0.8620, UEM: 0.5124, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0660, partial_loss/deprel_loss: 0.1975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3009, loss: 0.9505, batch_reg_loss: 0.1297, reg_loss: 0.1295 ||:  23%|##2       | 25/111 [00:17<01:05,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8453, UAS: 0.9192, LAS: 0.8603, UEM: 0.4831, LEM: 0.2796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0821, partial_loss/deprel_loss: 0.8557, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0308, loss: 0.9618, batch_reg_loss: 0.1298, reg_loss: 0.1295 ||:  26%|##6       | 29/111 [00:20<00:58,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9221, LAS: 0.8634, UEM: 0.5052, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1437, partial_loss/deprel_loss: 0.3982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4772, loss: 0.9353, batch_reg_loss: 0.1299, reg_loss: 0.1295 ||:  29%|##8       | 32/111 [00:22<00:56,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8467, UAS: 0.9198, LAS: 0.8611, UEM: 0.4829, LEM: 0.2747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1443, partial_loss/deprel_loss: 0.8956, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0753, loss: 0.9539, batch_reg_loss: 0.1299, reg_loss: 0.1296 ||:  32%|###2      | 36/111 [00:25<00:52,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8848, UAS: 0.9206, LAS: 0.8620, UEM: 0.4807, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6102, partial_loss/deprel_loss: 0.6688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7871, loss: 0.9482, batch_reg_loss: 0.1300, reg_loss: 0.1296 ||:  35%|###5      | 39/111 [00:27<00:50,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8373, UAS: 0.9212, LAS: 0.8630, UEM: 0.4812, LEM: 0.2660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1409, partial_loss/deprel_loss: 1.0084, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1650, loss: 0.9400, batch_reg_loss: 0.1301, reg_loss: 0.1297 ||:  39%|###8      | 43/111 [00:29<00:46,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9227, LAS: 0.8648, UEM: 0.4976, LEM: 0.2776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2244, partial_loss/deprel_loss: 0.4163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5081, loss: 0.9244, batch_reg_loss: 0.1302, reg_loss: 0.1297 ||:  42%|####2     | 47/111 [00:32<00:42,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9247, LAS: 0.8669, UEM: 0.5112, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2245, partial_loss/deprel_loss: 0.4146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5068, loss: 0.9069, batch_reg_loss: 0.1302, reg_loss: 0.1297 ||:  45%|####5     | 50/111 [00:34<00:41,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9256, LAS: 0.8678, UEM: 0.5218, LEM: 0.2915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9718, partial_loss/deprel_loss: 0.9520, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0862, loss: 0.8975, batch_reg_loss: 0.1303, reg_loss: 0.1298 ||:  48%|####7     | 53/111 [00:36<00:41,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9273, LAS: 0.8700, UEM: 0.5428, LEM: 0.3133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5033, partial_loss/deprel_loss: 0.6351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7391, loss: 0.8805, batch_reg_loss: 0.1304, reg_loss: 0.1298 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8903, UAS: 0.9283, LAS: 0.8711, UEM: 0.5485, LEM: 0.3151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4286, partial_loss/deprel_loss: 0.5783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6788, loss: 0.8710, batch_reg_loss: 0.1304, reg_loss: 0.1298 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9295, LAS: 0.8725, UEM: 0.5627, LEM: 0.3281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3033, partial_loss/deprel_loss: 0.4829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5775, loss: 0.8593, batch_reg_loss: 0.1305, reg_loss: 0.1299 ||:  57%|#####6    | 63/111 [00:43<00:34,  1.40it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8837, UAS: 0.9297, LAS: 0.8727, UEM: 0.5516, LEM: 0.3177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5741, partial_loss/deprel_loss: 0.7504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8456, loss: 0.8591, batch_reg_loss: 0.1305, reg_loss: 0.1299 ||:  60%|######    | 67/111 [00:46<00:30,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9298, LAS: 0.8726, UEM: 0.5457, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1037, partial_loss/deprel_loss: 0.9766, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1326, loss: 0.8598, batch_reg_loss: 0.1306, reg_loss: 0.1299 ||:  64%|######3   | 71/111 [00:48<00:27,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9304, LAS: 0.8730, UEM: 0.5460, LEM: 0.3102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3699, partial_loss/deprel_loss: 0.5524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6465, loss: 0.8557, batch_reg_loss: 0.1306, reg_loss: 0.1300 ||:  68%|######7   | 75/111 [00:51<00:23,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9292, LAS: 0.8716, UEM: 0.5398, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4855, partial_loss/deprel_loss: 1.0485, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2665, loss: 0.8661, batch_reg_loss: 0.1307, reg_loss: 0.1300 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9298, LAS: 0.8723, UEM: 0.5468, LEM: 0.3095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4292, partial_loss/deprel_loss: 0.6107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7051, loss: 0.8599, batch_reg_loss: 0.1307, reg_loss: 0.1300 ||:  75%|#######4  | 83/111 [00:57<00:19,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9290, LAS: 0.8713, UEM: 0.5385, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5060, partial_loss/deprel_loss: 0.6993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7915, loss: 0.8692, batch_reg_loss: 0.1308, reg_loss: 0.1301 ||:  78%|#######8  | 87/111 [00:59<00:15,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9280, LAS: 0.8700, UEM: 0.5342, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7672, partial_loss/deprel_loss: 0.9964, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0814, loss: 0.8801, batch_reg_loss: 0.1309, reg_loss: 0.1301 ||:  82%|########1 | 91/111 [01:01<00:12,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9272, LAS: 0.8690, UEM: 0.5320, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2635, partial_loss/deprel_loss: 0.4135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.8877, batch_reg_loss: 0.1310, reg_loss: 0.1301 ||:  86%|########5 | 95/111 [01:04<00:10,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9272, LAS: 0.8689, UEM: 0.5316, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3234, partial_loss/deprel_loss: 0.5304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6200, loss: 0.8883, batch_reg_loss: 0.1310, reg_loss: 0.1302 ||:  88%|########8 | 98/111 [01:07<00:09,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9277, LAS: 0.8693, UEM: 0.5311, LEM: 0.2932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3735, partial_loss/deprel_loss: 0.6150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6978, loss: 0.8848, batch_reg_loss: 0.1311, reg_loss: 0.1302 ||:  92%|#########1| 102/111 [01:09<00:05,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8988, UAS: 0.9277, LAS: 0.8695, UEM: 0.5285, LEM: 0.2901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4234, partial_loss/deprel_loss: 0.5900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.8845, batch_reg_loss: 0.1312, reg_loss: 0.1302 ||:  95%|#########5| 106/111 [01:12<00:03,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9270, LAS: 0.8688, UEM: 0.5260, LEM: 0.2884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2633, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5303, loss: 0.8900, batch_reg_loss: 0.1313, reg_loss: 0.1303 ||:  99%|#########9| 110/111 [01:15<00:00,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9271, LAS: 0.8689, UEM: 0.5252, LEM: 0.2873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5826, partial_loss/deprel_loss: 0.7173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8217, loss: 0.8894, batch_reg_loss: 0.1313, reg_loss: 0.1303 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:38:32,176 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.717  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.583  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.130  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - UEM                      |     0.525  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - LAS                      |     0.869  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - loss                     |     0.889  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:38:32,177 - INFO - combo.training.tensorboard_writer - LEM                      |     0.287  |       N/A\n",
      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - UAS                      |     0.927  |       N/A\n",
      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - EM                       |     0.874  |       N/A\n",
      "2023-04-06 23:38:32,178 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:38:32,179 - INFO - combo.training.trainer - Epoch duration: 0:01:15.709732\n",
      "2023-04-06 23:38:32,179 - INFO - combo.training.trainer - Estimated training time remaining: 7:58:15\n",
      "2023-04-06 23:38:32,179 - INFO - allennlp.training.trainer - Epoch 37/399\n",
      "2023-04-06 23:38:32,179 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:38:32,179 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:38:32,188 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9011, UAS: 0.9332, LAS: 0.8765, UEM: 0.4678, LEM: 0.2122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3651, partial_loss/deprel_loss: 0.4818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5898, loss: 0.8393, batch_reg_loss: 0.1314, reg_loss: 0.1314 ||:   4%|3         | 4/111 [00:02<01:08,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9418, LAS: 0.8880, UEM: 0.6776, LEM: 0.4819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5287, partial_loss/deprel_loss: 0.6488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7562, loss: 0.7479, batch_reg_loss: 0.1315, reg_loss: 0.1314 ||:   6%|6         | 7/111 [00:05<01:12,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9401, LAS: 0.8861, UEM: 0.6351, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3285, partial_loss/deprel_loss: 0.5358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6258, loss: 0.7604, batch_reg_loss: 0.1315, reg_loss: 0.1314 ||:   9%|9         | 10/111 [00:07<01:09,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8978, UAS: 0.9390, LAS: 0.8841, UEM: 0.5888, LEM: 0.3604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3963, partial_loss/deprel_loss: 0.5860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6797, loss: 0.7824, batch_reg_loss: 0.1316, reg_loss: 0.1315 ||:  13%|#2        | 14/111 [00:09<01:03,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8355, UAS: 0.9365, LAS: 0.8814, UEM: 0.5696, LEM: 0.3415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2521, partial_loss/deprel_loss: 0.9936, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1770, loss: 0.8040, batch_reg_loss: 0.1316, reg_loss: 0.1315 ||:  15%|#5        | 17/111 [00:11<01:03,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8802, UAS: 0.9375, LAS: 0.8818, UEM: 0.5544, LEM: 0.3182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5666, partial_loss/deprel_loss: 0.7057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8096, loss: 0.7999, batch_reg_loss: 0.1317, reg_loss: 0.1315 ||:  18%|#8        | 20/111 [00:13<01:01,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9373, LAS: 0.8809, UEM: 0.5360, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6051, partial_loss/deprel_loss: 0.7038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8158, loss: 0.8015, batch_reg_loss: 0.1317, reg_loss: 0.1315 ||:  21%|##        | 23/111 [00:15<00:59,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9358, LAS: 0.8789, UEM: 0.5296, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3506, partial_loss/deprel_loss: 0.5437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6369, loss: 0.8139, batch_reg_loss: 0.1318, reg_loss: 0.1316 ||:  24%|##4       | 27/111 [00:18<00:56,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9368, LAS: 0.8799, UEM: 0.5409, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2640, partial_loss/deprel_loss: 0.4096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.8028, batch_reg_loss: 0.1319, reg_loss: 0.1316 ||:  28%|##7       | 31/111 [00:20<00:52,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7975, UAS: 0.9310, LAS: 0.8739, UEM: 0.5321, LEM: 0.2887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7992, partial_loss/deprel_loss: 1.2460, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4886, loss: 0.8534, batch_reg_loss: 0.1319, reg_loss: 0.1316 ||:  31%|###       | 34/111 [00:23<00:53,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9295, LAS: 0.8724, UEM: 0.5293, LEM: 0.2876, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5793, partial_loss/deprel_loss: 0.6494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7674, loss: 0.8636, batch_reg_loss: 0.1320, reg_loss: 0.1317 ||:  34%|###4      | 38/111 [00:25<00:49,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9291, LAS: 0.8717, UEM: 0.5239, LEM: 0.2817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7996, partial_loss/deprel_loss: 0.7570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8976, loss: 0.8671, batch_reg_loss: 0.1321, reg_loss: 0.1317 ||:  37%|###6      | 41/111 [00:27<00:48,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9284, LAS: 0.8710, UEM: 0.5212, LEM: 0.2801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8072, partial_loss/deprel_loss: 0.7757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9141, loss: 0.8724, batch_reg_loss: 0.1321, reg_loss: 0.1317 ||:  40%|###9      | 44/111 [00:30<00:47,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9267, LAS: 0.8691, UEM: 0.5128, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3557, partial_loss/deprel_loss: 0.5814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6685, loss: 0.8894, batch_reg_loss: 0.1322, reg_loss: 0.1318 ||:  42%|####2     | 47/111 [00:32<00:45,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9279, LAS: 0.8706, UEM: 0.5283, LEM: 0.2888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2007, partial_loss/deprel_loss: 0.3160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4252, loss: 0.8751, batch_reg_loss: 0.1323, reg_loss: 0.1318 ||:  46%|####5     | 51/111 [00:35<00:42,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9263, LAS: 0.8688, UEM: 0.5287, LEM: 0.2919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2684, partial_loss/deprel_loss: 0.4409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5387, loss: 0.8898, batch_reg_loss: 0.1323, reg_loss: 0.1318 ||:  49%|####8     | 54/111 [00:37<00:41,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8261, UAS: 0.9249, LAS: 0.8676, UEM: 0.5162, LEM: 0.2841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4259, partial_loss/deprel_loss: 0.9915, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2108, loss: 0.8998, batch_reg_loss: 0.1324, reg_loss: 0.1319 ||:  51%|#####1    | 57/111 [00:39<00:38,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9245, LAS: 0.8671, UEM: 0.5301, LEM: 0.3042, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1480, partial_loss/deprel_loss: 0.2760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3828, loss: 0.9042, batch_reg_loss: 0.1325, reg_loss: 0.1319 ||:  54%|#####4    | 60/111 [00:41<00:36,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8584, UAS: 0.9240, LAS: 0.8665, UEM: 0.5210, LEM: 0.2975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8904, partial_loss/deprel_loss: 0.8210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9674, loss: 0.9083, batch_reg_loss: 0.1325, reg_loss: 0.1319 ||:  57%|#####6    | 63/111 [00:43<00:34,  1.41it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9239, LAS: 0.8662, UEM: 0.5185, LEM: 0.2949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3084, partial_loss/deprel_loss: 0.5285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6171, loss: 0.9107, batch_reg_loss: 0.1326, reg_loss: 0.1319 ||:  59%|#####9    | 66/111 [00:45<00:31,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9242, LAS: 0.8665, UEM: 0.5151, LEM: 0.2909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3071, partial_loss/deprel_loss: 0.4553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5583, loss: 0.9102, batch_reg_loss: 0.1327, reg_loss: 0.1320 ||:  63%|######3   | 70/111 [00:48<00:28,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8097, UAS: 0.9240, LAS: 0.8662, UEM: 0.5102, LEM: 0.2864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4604, partial_loss/deprel_loss: 1.2037, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3878, loss: 0.9143, batch_reg_loss: 0.1327, reg_loss: 0.1320 ||:  67%|######6   | 74/111 [00:50<00:24,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9252, LAS: 0.8674, UEM: 0.5201, LEM: 0.2896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4208, partial_loss/deprel_loss: 0.6707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7536, loss: 0.9017, batch_reg_loss: 0.1328, reg_loss: 0.1321 ||:  70%|#######   | 78/111 [00:53<00:22,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.9250, LAS: 0.8668, UEM: 0.5147, LEM: 0.2835, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4345, partial_loss/deprel_loss: 0.6903, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7721, loss: 0.9045, batch_reg_loss: 0.1329, reg_loss: 0.1321 ||:  74%|#######3  | 82/111 [00:55<00:18,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9257, LAS: 0.8676, UEM: 0.5136, LEM: 0.2802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7814, partial_loss/deprel_loss: 0.6975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8472, loss: 0.8976, batch_reg_loss: 0.1330, reg_loss: 0.1321 ||:  77%|#######7  | 86/111 [00:58<00:16,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8497, UAS: 0.9262, LAS: 0.8681, UEM: 0.5186, LEM: 0.2849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9150, partial_loss/deprel_loss: 0.9404, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0683, loss: 0.8935, batch_reg_loss: 0.1331, reg_loss: 0.1322 ||:  81%|########1 | 90/111 [01:00<00:13,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8307, UAS: 0.9267, LAS: 0.8686, UEM: 0.5241, LEM: 0.2879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1581, partial_loss/deprel_loss: 0.9771, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1465, loss: 0.8894, batch_reg_loss: 0.1331, reg_loss: 0.1322 ||:  85%|########4 | 94/111 [01:03<00:10,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8477, UAS: 0.9258, LAS: 0.8677, UEM: 0.5219, LEM: 0.2883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0681, partial_loss/deprel_loss: 1.0203, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1631, loss: 0.8979, batch_reg_loss: 0.1332, reg_loss: 0.1323 ||:  88%|########8 | 98/111 [01:06<00:08,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9266, LAS: 0.8686, UEM: 0.5311, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3334, partial_loss/deprel_loss: 0.4944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5954, loss: 0.8899, batch_reg_loss: 0.1333, reg_loss: 0.1323 ||:  92%|#########1| 102/111 [01:09<00:06,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9265, LAS: 0.8684, UEM: 0.5272, LEM: 0.2905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4459, partial_loss/deprel_loss: 0.6718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7599, loss: 0.8925, batch_reg_loss: 0.1333, reg_loss: 0.1323 ||:  95%|#########4| 105/111 [01:11<00:04,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9261, LAS: 0.8679, UEM: 0.5228, LEM: 0.2874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5106, partial_loss/deprel_loss: 0.6320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7411, loss: 0.8953, batch_reg_loss: 0.1334, reg_loss: 0.1324 ||:  97%|#########7| 108/111 [01:13<00:02,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9265, LAS: 0.8684, UEM: 0.5222, LEM: 0.2859, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5453, partial_loss/deprel_loss: 0.6499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7624, loss: 0.8914, batch_reg_loss: 0.1334, reg_loss: 0.1324 ||: 100%|##########| 111/111 [01:15<00:00,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9265, LAS: 0.8684, UEM: 0.5222, LEM: 0.2859, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5453, partial_loss/deprel_loss: 0.6499, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7624, loss: 0.8914, batch_reg_loss: 0.1334, reg_loss: 0.1324 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:39:48,042 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.650  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.545  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.132  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - UEM                      |     0.522  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - LAS                      |     0.868  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - loss                     |     0.891  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - LEM                      |     0.286  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - UAS                      |     0.926  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:39:48,043 - INFO - combo.training.tensorboard_writer - EM                       |     0.894  |       N/A\n",
      "2023-04-06 23:39:48,044 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:39:48,044 - INFO - combo.training.trainer - Epoch duration: 0:01:15.865530\n",
      "2023-04-06 23:39:48,045 - INFO - combo.training.trainer - Estimated training time remaining: 7:56:25\n",
      "2023-04-06 23:39:48,045 - INFO - allennlp.training.trainer - Epoch 38/399\n",
      "2023-04-06 23:39:48,045 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:39:48,045 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:39:48,052 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9161, LAS: 0.8534, UEM: 0.1467, LEM: 0.0433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0036, partial_loss/deprel_loss: 0.8636, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0250, loss: 0.9915, batch_reg_loss: 0.1335, reg_loss: 0.1335 ||:   3%|2         | 3/111 [00:02<01:16,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8142, UAS: 0.9123, LAS: 0.8513, UEM: 0.1802, LEM: 0.0496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5122, partial_loss/deprel_loss: 1.1313, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3410, loss: 1.0190, batch_reg_loss: 0.1335, reg_loss: 0.1335 ||:   5%|5         | 6/111 [00:04<01:13,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9073, LAS: 0.8475, UEM: 0.2964, LEM: 0.1575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3239, partial_loss/deprel_loss: 0.4766, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 1.0513, batch_reg_loss: 0.1336, reg_loss: 0.1335 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9198, LAS: 0.8619, UEM: 0.4844, LEM: 0.2866, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5275, partial_loss/deprel_loss: 0.6271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7409, loss: 0.9421, batch_reg_loss: 0.1337, reg_loss: 0.1336 ||:  13%|#2        | 14/111 [00:09<01:04,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9218, LAS: 0.8642, UEM: 0.4745, LEM: 0.2762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3876, partial_loss/deprel_loss: 0.4967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6086, loss: 0.9359, batch_reg_loss: 0.1338, reg_loss: 0.1336 ||:  15%|#5        | 17/111 [00:11<01:02,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9248, LAS: 0.8685, UEM: 0.4811, LEM: 0.2716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4559, partial_loss/deprel_loss: 0.6083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7117, loss: 0.9002, batch_reg_loss: 0.1338, reg_loss: 0.1336 ||:  19%|#8        | 21/111 [00:13<00:59,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9240, LAS: 0.8676, UEM: 0.4905, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5441, partial_loss/deprel_loss: 0.6274, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7447, loss: 0.9093, batch_reg_loss: 0.1339, reg_loss: 0.1337 ||:  22%|##1       | 24/111 [00:16<01:00,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9241, LAS: 0.8673, UEM: 0.4942, LEM: 0.2837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0271, partial_loss/deprel_loss: 0.9570, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1050, loss: 0.9047, batch_reg_loss: 0.1340, reg_loss: 0.1337 ||:  24%|##4       | 27/111 [00:18<00:59,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9236, LAS: 0.8662, UEM: 0.4872, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3372, partial_loss/deprel_loss: 0.5897, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6733, loss: 0.9112, batch_reg_loss: 0.1340, reg_loss: 0.1337 ||:  27%|##7       | 30/111 [00:20<00:58,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9250, LAS: 0.8682, UEM: 0.5068, LEM: 0.2874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3059, partial_loss/deprel_loss: 0.4710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5721, loss: 0.8960, batch_reg_loss: 0.1341, reg_loss: 0.1338 ||:  30%|##9       | 33/111 [00:22<00:55,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7594, UAS: 0.9238, LAS: 0.8673, UEM: 0.5198, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.6236, partial_loss/deprel_loss: 1.6358, partial_loss/cycle_loss: 0.0000, batch_loss: 1.9675, loss: 0.9092, batch_reg_loss: 0.1341, reg_loss: 0.1338 ||:  32%|###2      | 36/111 [00:25<00:56,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8449, UAS: 0.9248, LAS: 0.8688, UEM: 0.5415, LEM: 0.3280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0372, partial_loss/deprel_loss: 0.9183, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0763, loss: 0.8961, batch_reg_loss: 0.1342, reg_loss: 0.1338 ||:  35%|###5      | 39/111 [00:27<00:53,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9254, LAS: 0.8697, UEM: 0.5361, LEM: 0.3217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3875, partial_loss/deprel_loss: 0.4584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5785, loss: 0.8888, batch_reg_loss: 0.1343, reg_loss: 0.1338 ||:  38%|###7      | 42/111 [00:29<00:51,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9276, LAS: 0.8721, UEM: 0.5593, LEM: 0.3361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1639, partial_loss/deprel_loss: 0.4386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5180, loss: 0.8677, batch_reg_loss: 0.1343, reg_loss: 0.1339 ||:  41%|####1     | 46/111 [00:32<00:46,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8959, UAS: 0.9286, LAS: 0.8729, UEM: 0.5516, LEM: 0.3245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4020, partial_loss/deprel_loss: 0.5790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6780, loss: 0.8602, batch_reg_loss: 0.1344, reg_loss: 0.1339 ||:  45%|####5     | 50/111 [00:34<00:42,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8677, UAS: 0.9283, LAS: 0.8724, UEM: 0.5407, LEM: 0.3145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7025, partial_loss/deprel_loss: 0.8024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9169, loss: 0.8647, batch_reg_loss: 0.1345, reg_loss: 0.1340 ||:  48%|####7     | 53/111 [00:37<00:42,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9300, LAS: 0.8742, UEM: 0.5445, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3832, partial_loss/deprel_loss: 0.6491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7305, loss: 0.8520, batch_reg_loss: 0.1345, reg_loss: 0.1340 ||:  51%|#####1    | 57/111 [00:39<00:38,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8420, UAS: 0.9292, LAS: 0.8732, UEM: 0.5361, LEM: 0.3047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0990, partial_loss/deprel_loss: 0.9602, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1226, loss: 0.8597, batch_reg_loss: 0.1346, reg_loss: 0.1340 ||:  55%|#####4    | 61/111 [00:42<00:34,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9296, LAS: 0.8736, UEM: 0.5367, LEM: 0.3039, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4994, partial_loss/deprel_loss: 0.5723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6924, loss: 0.8544, batch_reg_loss: 0.1346, reg_loss: 0.1341 ||:  58%|#####7    | 64/111 [00:44<00:33,  1.42it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7939, UAS: 0.9282, LAS: 0.8718, UEM: 0.5287, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7784, partial_loss/deprel_loss: 1.2841, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5176, loss: 0.8678, batch_reg_loss: 0.1347, reg_loss: 0.1341 ||:  60%|######    | 67/111 [00:46<00:30,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8464, UAS: 0.9276, LAS: 0.8711, UEM: 0.5219, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9674, partial_loss/deprel_loss: 0.8496, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0079, loss: 0.8726, batch_reg_loss: 0.1347, reg_loss: 0.1341 ||:  63%|######3   | 70/111 [00:48<00:29,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9280, LAS: 0.8714, UEM: 0.5153, LEM: 0.2841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4529, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7153, loss: 0.8731, batch_reg_loss: 0.1348, reg_loss: 0.1341 ||:  67%|######6   | 74/111 [00:51<00:24,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8183, UAS: 0.9288, LAS: 0.8724, UEM: 0.5400, LEM: 0.3144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4612, partial_loss/deprel_loss: 1.1146, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3188, loss: 0.8662, batch_reg_loss: 0.1349, reg_loss: 0.1342 ||:  70%|#######   | 78/111 [00:54<00:23,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9283, LAS: 0.8717, UEM: 0.5372, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3601, partial_loss/deprel_loss: 0.5822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6727, loss: 0.8713, batch_reg_loss: 0.1349, reg_loss: 0.1342 ||:  73%|#######2  | 81/111 [00:56<00:21,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9280, LAS: 0.8713, UEM: 0.5341, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5286, partial_loss/deprel_loss: 0.6541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7640, loss: 0.8738, batch_reg_loss: 0.1350, reg_loss: 0.1342 ||:  76%|#######5  | 84/111 [00:58<00:18,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9284, LAS: 0.8716, UEM: 0.5292, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6210, partial_loss/deprel_loss: 0.6848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8071, loss: 0.8722, batch_reg_loss: 0.1351, reg_loss: 0.1343 ||:  79%|#######9  | 88/111 [01:01<00:15,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8379, UAS: 0.9283, LAS: 0.8715, UEM: 0.5263, LEM: 0.3003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2265, partial_loss/deprel_loss: 0.9465, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1377, loss: 0.8723, batch_reg_loss: 0.1352, reg_loss: 0.1343 ||:  83%|########2 | 92/111 [01:03<00:12,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9284, LAS: 0.8716, UEM: 0.5317, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3219, partial_loss/deprel_loss: 0.5873, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6694, loss: 0.8716, batch_reg_loss: 0.1352, reg_loss: 0.1343 ||:  86%|########6 | 96/111 [01:06<00:10,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7974, UAS: 0.9280, LAS: 0.8711, UEM: 0.5262, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6483, partial_loss/deprel_loss: 1.2148, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4368, loss: 0.8753, batch_reg_loss: 0.1353, reg_loss: 0.1344 ||:  90%|######### | 100/111 [01:09<00:07,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8199, UAS: 0.9261, LAS: 0.8692, UEM: 0.5205, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4797, partial_loss/deprel_loss: 1.0433, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2660, loss: 0.8891, batch_reg_loss: 0.1354, reg_loss: 0.1344 ||:  93%|#########2| 103/111 [01:11<00:05,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8481, UAS: 0.9259, LAS: 0.8689, UEM: 0.5149, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9886, partial_loss/deprel_loss: 0.9805, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1176, loss: 0.8923, batch_reg_loss: 0.1354, reg_loss: 0.1345 ||:  96%|#########6| 107/111 [01:14<00:02,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9264, LAS: 0.8696, UEM: 0.5161, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2614, partial_loss/deprel_loss: 0.4928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5820, loss: 0.8875, batch_reg_loss: 0.1355, reg_loss: 0.1345 ||: 100%|##########| 111/111 [01:16<00:00,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9264, LAS: 0.8696, UEM: 0.5161, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2614, partial_loss/deprel_loss: 0.4928, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5820, loss: 0.8875, batch_reg_loss: 0.1355, reg_loss: 0.1345 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.493  |       N/A\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.261  |       N/A\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.134  |       N/A\n",
      "2023-04-06 23:41:04,480 - INFO - combo.training.tensorboard_writer - UEM                      |     0.516  |       N/A\n",
      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - LAS                      |     0.870  |       N/A\n",
      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - loss                     |     0.888  |       N/A\n",
      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - LEM                      |     0.291  |       N/A\n",
      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - UAS                      |     0.926  |       N/A\n",
      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - EM                       |     0.911  |       N/A\n",
      "2023-04-06 23:41:04,481 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:41:04,482 - INFO - combo.training.trainer - Epoch duration: 0:01:16.437091\n",
      "2023-04-06 23:41:04,482 - INFO - combo.training.trainer - Estimated training time remaining: 7:54:43\n",
      "2023-04-06 23:41:04,482 - INFO - allennlp.training.trainer - Epoch 39/399\n",
      "2023-04-06 23:41:04,482 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:41:04,482 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:41:04,489 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9271, LAS: 0.8726, UEM: 0.3130, LEM: 0.1275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7463, partial_loss/deprel_loss: 0.7432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8794, loss: 0.8727, batch_reg_loss: 0.1356, reg_loss: 0.1356 ||:   3%|2         | 3/111 [00:02<01:26,  1.24it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9318, LAS: 0.8801, UEM: 0.6530, LEM: 0.5221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8199, partial_loss/deprel_loss: 0.7412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8926, loss: 0.8137, batch_reg_loss: 0.1357, reg_loss: 0.1356 ||:   5%|5         | 6/111 [00:04<01:23,  1.25it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9279, LAS: 0.8751, UEM: 0.6365, LEM: 0.4647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4726, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6784, loss: 0.8520, batch_reg_loss: 0.1357, reg_loss: 0.1356 ||:   8%|8         | 9/111 [00:07<01:20,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9365, LAS: 0.8843, UEM: 0.6833, LEM: 0.4764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1591, partial_loss/deprel_loss: 0.3740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4668, loss: 0.7746, batch_reg_loss: 0.1358, reg_loss: 0.1357 ||:  11%|#         | 12/111 [00:09<01:17,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9311, LAS: 0.8782, UEM: 0.6278, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4972, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6593, loss: 0.8231, batch_reg_loss: 0.1358, reg_loss: 0.1357 ||:  14%|#4        | 16/111 [00:11<01:08,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9309, LAS: 0.8773, UEM: 0.5934, LEM: 0.3878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9564, partial_loss/deprel_loss: 0.8364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9963, loss: 0.8333, batch_reg_loss: 0.1359, reg_loss: 0.1357 ||:  17%|#7        | 19/111 [00:14<01:07,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9315, LAS: 0.8780, UEM: 0.6091, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1309, partial_loss/deprel_loss: 0.2656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3746, loss: 0.8262, batch_reg_loss: 0.1360, reg_loss: 0.1358 ||:  20%|#9        | 22/111 [00:16<01:05,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9291, LAS: 0.8751, UEM: 0.5884, LEM: 0.3928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4094, partial_loss/deprel_loss: 0.5780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6803, loss: 0.8458, batch_reg_loss: 0.1360, reg_loss: 0.1358 ||:  23%|##2       | 25/111 [00:18<01:03,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9310, LAS: 0.8771, UEM: 0.5775, LEM: 0.3731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4881, partial_loss/deprel_loss: 0.6655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7661, loss: 0.8331, batch_reg_loss: 0.1361, reg_loss: 0.1358 ||:  25%|##5       | 28/111 [00:20<00:59,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9315, LAS: 0.8775, UEM: 0.5766, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3092, partial_loss/deprel_loss: 0.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5658, loss: 0.8266, batch_reg_loss: 0.1361, reg_loss: 0.1358 ||:  28%|##7       | 31/111 [00:23<01:02,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9334, LAS: 0.8794, UEM: 0.5744, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4142, partial_loss/deprel_loss: 0.5945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6946, loss: 0.8153, batch_reg_loss: 0.1362, reg_loss: 0.1359 ||:  32%|###1      | 35/111 [00:25<00:56,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9338, LAS: 0.8798, UEM: 0.5824, LEM: 0.3585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1928, partial_loss/deprel_loss: 0.3426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4489, loss: 0.8117, batch_reg_loss: 0.1363, reg_loss: 0.1359 ||:  35%|###5      | 39/111 [00:28<00:49,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9350, LAS: 0.8810, UEM: 0.5892, LEM: 0.3634, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3795, partial_loss/deprel_loss: 0.5966, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6895, loss: 0.8028, batch_reg_loss: 0.1363, reg_loss: 0.1360 ||:  39%|###8      | 43/111 [00:30<00:45,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9368, LAS: 0.8829, UEM: 0.5965, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.4359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5324, loss: 0.7887, batch_reg_loss: 0.1364, reg_loss: 0.1360 ||:  42%|####2     | 47/111 [00:32<00:40,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8263, UAS: 0.9351, LAS: 0.8808, UEM: 0.5802, LEM: 0.3496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2804, partial_loss/deprel_loss: 1.0114, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2017, loss: 0.8047, batch_reg_loss: 0.1365, reg_loss: 0.1360 ||:  46%|####5     | 51/111 [00:35<00:38,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7825, UAS: 0.9341, LAS: 0.8795, UEM: 0.5765, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8381, partial_loss/deprel_loss: 1.2425, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4981, loss: 0.8138, batch_reg_loss: 0.1365, reg_loss: 0.1361 ||:  50%|####9     | 55/111 [00:38<00:38,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9343, LAS: 0.8798, UEM: 0.5758, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2422, partial_loss/deprel_loss: 0.3801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4891, loss: 0.8124, batch_reg_loss: 0.1366, reg_loss: 0.1361 ||:  52%|#####2    | 58/111 [00:40<00:36,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9338, LAS: 0.8791, UEM: 0.5644, LEM: 0.3330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5629, partial_loss/deprel_loss: 0.6541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7725, loss: 0.8162, batch_reg_loss: 0.1366, reg_loss: 0.1361 ||:  56%|#####5    | 62/111 [00:42<00:31,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8466, UAS: 0.9340, LAS: 0.8790, UEM: 0.5651, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0235, partial_loss/deprel_loss: 0.9341, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0887, loss: 0.8163, batch_reg_loss: 0.1367, reg_loss: 0.1362 ||:  59%|#####9    | 66/111 [00:45<00:28,  1.61it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8475, UAS: 0.9333, LAS: 0.8778, UEM: 0.5585, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8708, partial_loss/deprel_loss: 1.0278, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1332, loss: 0.8263, batch_reg_loss: 0.1368, reg_loss: 0.1362 ||:  63%|######3   | 70/111 [00:48<00:26,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9324, LAS: 0.8769, UEM: 0.5601, LEM: 0.3258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4513, partial_loss/deprel_loss: 0.5420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6606, loss: 0.8319, batch_reg_loss: 0.1368, reg_loss: 0.1362 ||:  67%|######6   | 74/111 [00:50<00:23,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9312, LAS: 0.8757, UEM: 0.5582, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3023, partial_loss/deprel_loss: 0.4266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5386, loss: 0.8426, batch_reg_loss: 0.1369, reg_loss: 0.1363 ||:  70%|#######   | 78/111 [00:53<00:22,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9305, LAS: 0.8749, UEM: 0.5510, LEM: 0.3210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3944, partial_loss/deprel_loss: 0.5743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6753, loss: 0.8499, batch_reg_loss: 0.1370, reg_loss: 0.1363 ||:  74%|#######3  | 82/111 [00:56<00:19,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9310, LAS: 0.8753, UEM: 0.5488, LEM: 0.3173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3884, partial_loss/deprel_loss: 0.5201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6308, loss: 0.8477, batch_reg_loss: 0.1370, reg_loss: 0.1363 ||:  77%|#######6  | 85/111 [00:58<00:17,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8486, UAS: 0.9303, LAS: 0.8745, UEM: 0.5408, LEM: 0.3115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9831, partial_loss/deprel_loss: 0.8483, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0123, loss: 0.8528, batch_reg_loss: 0.1371, reg_loss: 0.1363 ||:  79%|#######9  | 88/111 [01:00<00:15,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9297, LAS: 0.8737, UEM: 0.5392, LEM: 0.3100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4849, partial_loss/deprel_loss: 0.6716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7715, loss: 0.8581, batch_reg_loss: 0.1372, reg_loss: 0.1364 ||:  83%|########2 | 92/111 [01:02<00:12,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8381, UAS: 0.9299, LAS: 0.8737, UEM: 0.5393, LEM: 0.3086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0448, partial_loss/deprel_loss: 0.8961, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0631, loss: 0.8567, batch_reg_loss: 0.1373, reg_loss: 0.1364 ||:  86%|########6 | 96/111 [01:05<00:09,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8109, UAS: 0.9285, LAS: 0.8721, UEM: 0.5326, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6162, partial_loss/deprel_loss: 1.2664, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4737, loss: 0.8717, batch_reg_loss: 0.1374, reg_loss: 0.1364 ||:  90%|######### | 100/111 [01:08<00:07,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9289, LAS: 0.8726, UEM: 0.5333, LEM: 0.3021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6726, partial_loss/deprel_loss: 0.6797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8157, loss: 0.8672, batch_reg_loss: 0.1374, reg_loss: 0.1365 ||:  93%|#########2| 103/111 [01:10<00:05,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8184, UAS: 0.9280, LAS: 0.8714, UEM: 0.5288, LEM: 0.2982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3722, partial_loss/deprel_loss: 1.1339, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3191, loss: 0.8774, batch_reg_loss: 0.1375, reg_loss: 0.1365 ||:  96%|#########6| 107/111 [01:13<00:02,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8885, UAS: 0.9276, LAS: 0.8710, UEM: 0.5262, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5914, partial_loss/deprel_loss: 0.5512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6968, loss: 0.8794, batch_reg_loss: 0.1376, reg_loss: 0.1365 ||: 100%|##########| 111/111 [01:15<00:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8885, UAS: 0.9276, LAS: 0.8710, UEM: 0.5262, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5914, partial_loss/deprel_loss: 0.5512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6968, loss: 0.8794, batch_reg_loss: 0.1376, reg_loss: 0.1365 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
      "2023-04-06 23:42:20,382 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:42:20,382 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:42:20,382 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.551  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.591  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.137  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - UEM                      |     0.526  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - LAS                      |     0.871  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - loss                     |     0.879  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - LEM                      |     0.296  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:42:20,383 - INFO - combo.training.tensorboard_writer - UAS                      |     0.928  |       N/A\n",
      "2023-04-06 23:42:20,384 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:42:20,384 - INFO - combo.training.tensorboard_writer - EM                       |     0.889  |       N/A\n",
      "2023-04-06 23:42:20,384 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:42:20,384 - INFO - combo.training.trainer - Epoch duration: 0:01:15.902319\n",
      "2023-04-06 23:42:20,384 - INFO - combo.training.trainer - Estimated training time remaining: 7:52:57\n",
      "2023-04-06 23:42:20,385 - INFO - allennlp.training.trainer - Epoch 40/399\n",
      "2023-04-06 23:42:20,385 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:42:20,385 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:42:20,392 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8570, UAS: 0.9317, LAS: 0.8756, UEM: 0.5489, LEM: 0.2962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8281, partial_loss/deprel_loss: 0.8210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9601, loss: 0.8450, batch_reg_loss: 0.1376, reg_loss: 0.1376 ||:   4%|3         | 4/111 [00:02<01:11,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9439, LAS: 0.8883, UEM: 0.6418, LEM: 0.3665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3450, partial_loss/deprel_loss: 0.6142, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6981, loss: 0.7376, batch_reg_loss: 0.1377, reg_loss: 0.1376 ||:   6%|6         | 7/111 [00:05<01:17,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8566, UAS: 0.9406, LAS: 0.8849, UEM: 0.5977, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9597, partial_loss/deprel_loss: 0.8677, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0238, loss: 0.7623, batch_reg_loss: 0.1378, reg_loss: 0.1377 ||:   9%|9         | 10/111 [00:07<01:15,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8822, UAS: 0.9310, LAS: 0.8748, UEM: 0.5612, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5104, partial_loss/deprel_loss: 0.6686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7747, loss: 0.8476, batch_reg_loss: 0.1378, reg_loss: 0.1377 ||:  12%|#1        | 13/111 [00:09<01:12,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9346, LAS: 0.8790, UEM: 0.5600, LEM: 0.2946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3911, partial_loss/deprel_loss: 0.5027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6182, loss: 0.8156, batch_reg_loss: 0.1379, reg_loss: 0.1377 ||:  14%|#4        | 16/111 [00:12<01:10,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9323, LAS: 0.8758, UEM: 0.5203, LEM: 0.2651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9130, partial_loss/deprel_loss: 0.9827, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1067, loss: 0.8472, batch_reg_loss: 0.1379, reg_loss: 0.1378 ||:  18%|#8        | 20/111 [00:14<01:05,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9317, LAS: 0.8753, UEM: 0.4986, LEM: 0.2493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7004, partial_loss/deprel_loss: 0.7843, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9055, loss: 0.8557, batch_reg_loss: 0.1380, reg_loss: 0.1378 ||:  21%|##        | 23/111 [00:16<01:03,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9292, LAS: 0.8729, UEM: 0.4781, LEM: 0.2357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4067, partial_loss/deprel_loss: 0.5801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6835, loss: 0.8777, batch_reg_loss: 0.1381, reg_loss: 0.1378 ||:  24%|##4       | 27/111 [00:19<00:57,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8920, UAS: 0.9319, LAS: 0.8755, UEM: 0.5036, LEM: 0.2529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5178, partial_loss/deprel_loss: 0.6325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7477, loss: 0.8563, batch_reg_loss: 0.1381, reg_loss: 0.1379 ||:  28%|##7       | 31/111 [00:21<00:53,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8942, UAS: 0.9352, LAS: 0.8802, UEM: 0.5864, LEM: 0.3575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4408, partial_loss/deprel_loss: 0.6740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7656, loss: 0.8228, batch_reg_loss: 0.1382, reg_loss: 0.1379 ||:  31%|###       | 34/111 [00:24<00:56,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9331, LAS: 0.8780, UEM: 0.5720, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5699, partial_loss/deprel_loss: 0.6384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7629, loss: 0.8427, batch_reg_loss: 0.1382, reg_loss: 0.1379 ||:  33%|###3      | 37/111 [00:26<00:53,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9335, LAS: 0.8782, UEM: 0.5702, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2598, partial_loss/deprel_loss: 0.4579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5566, loss: 0.8412, batch_reg_loss: 0.1383, reg_loss: 0.1380 ||:  37%|###6      | 41/111 [00:29<00:48,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9335, LAS: 0.8780, UEM: 0.5642, LEM: 0.3338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8098, partial_loss/deprel_loss: 0.8707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9969, loss: 0.8421, batch_reg_loss: 0.1384, reg_loss: 0.1380 ||:  40%|###9      | 44/111 [00:31<00:48,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9330, LAS: 0.8774, UEM: 0.5605, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3433, partial_loss/deprel_loss: 0.4961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6040, loss: 0.8485, batch_reg_loss: 0.1384, reg_loss: 0.1380 ||:  42%|####2     | 47/111 [00:33<00:46,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9339, LAS: 0.8782, UEM: 0.5593, LEM: 0.3252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3518, partial_loss/deprel_loss: 0.4778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5911, loss: 0.8408, batch_reg_loss: 0.1385, reg_loss: 0.1380 ||:  45%|####5     | 50/111 [00:35<00:43,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8571, UAS: 0.9330, LAS: 0.8769, UEM: 0.5442, LEM: 0.3141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8073, partial_loss/deprel_loss: 0.8530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9824, loss: 0.8503, batch_reg_loss: 0.1385, reg_loss: 0.1381 ||:  49%|####8     | 54/111 [00:38<00:39,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9338, LAS: 0.8778, UEM: 0.5522, LEM: 0.3229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5658, partial_loss/deprel_loss: 0.7195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8274, loss: 0.8418, batch_reg_loss: 0.1386, reg_loss: 0.1381 ||:  51%|#####1    | 57/111 [00:40<00:39,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9322, LAS: 0.8759, UEM: 0.5406, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8303, partial_loss/deprel_loss: 0.8697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0005, loss: 0.8547, batch_reg_loss: 0.1387, reg_loss: 0.1381 ||:  55%|#####4    | 61/111 [00:43<00:34,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8370, UAS: 0.9314, LAS: 0.8750, UEM: 0.5303, LEM: 0.3042, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0092, partial_loss/deprel_loss: 0.9400, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0926, loss: 0.8601, batch_reg_loss: 0.1387, reg_loss: 0.1382 ||:  59%|#####8    | 65/111 [00:45<00:29,  1.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9322, LAS: 0.8760, UEM: 0.5436, LEM: 0.3141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2285, partial_loss/deprel_loss: 0.4120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.8483, batch_reg_loss: 0.1388, reg_loss: 0.1382 ||:  62%|######2   | 69/111 [00:48<00:27,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8724, UAS: 0.9315, LAS: 0.8752, UEM: 0.5358, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7962, partial_loss/deprel_loss: 0.7627, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9083, loss: 0.8559, batch_reg_loss: 0.1389, reg_loss: 0.1382 ||:  66%|######5   | 73/111 [00:50<00:25,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8556, UAS: 0.9308, LAS: 0.8746, UEM: 0.5263, LEM: 0.3017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9985, partial_loss/deprel_loss: 0.9882, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1292, loss: 0.8618, batch_reg_loss: 0.1390, reg_loss: 0.1383 ||:  69%|######9   | 77/111 [00:53<00:23,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9306, LAS: 0.8743, UEM: 0.5325, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2627, partial_loss/deprel_loss: 0.4424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5455, loss: 0.8641, batch_reg_loss: 0.1390, reg_loss: 0.1383 ||:  73%|#######2  | 81/111 [00:56<00:21,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9309, LAS: 0.8746, UEM: 0.5345, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3698, partial_loss/deprel_loss: 0.4835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5998, loss: 0.8614, batch_reg_loss: 0.1391, reg_loss: 0.1383 ||:  77%|#######6  | 85/111 [00:59<00:17,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9311, LAS: 0.8748, UEM: 0.5386, LEM: 0.3098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1995, partial_loss/deprel_loss: 0.3761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4799, loss: 0.8597, batch_reg_loss: 0.1392, reg_loss: 0.1384 ||:  79%|#######9  | 88/111 [01:01<00:15,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7752, UAS: 0.9306, LAS: 0.8743, UEM: 0.5397, LEM: 0.3097, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1589, partial_loss/deprel_loss: 1.3621, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6607, loss: 0.8631, batch_reg_loss: 0.1392, reg_loss: 0.1384 ||:  83%|########2 | 92/111 [01:03<00:12,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9301, LAS: 0.8737, UEM: 0.5393, LEM: 0.3071, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4196, partial_loss/deprel_loss: 0.6012, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7042, loss: 0.8662, batch_reg_loss: 0.1393, reg_loss: 0.1384 ||:  86%|########5 | 95/111 [01:06<00:11,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9305, LAS: 0.8740, UEM: 0.5404, LEM: 0.3065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3724, partial_loss/deprel_loss: 0.5439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6489, loss: 0.8636, batch_reg_loss: 0.1393, reg_loss: 0.1385 ||:  88%|########8 | 98/111 [01:08<00:09,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8126, UAS: 0.9289, LAS: 0.8722, UEM: 0.5321, LEM: 0.3010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5588, partial_loss/deprel_loss: 1.1620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3808, loss: 0.8792, batch_reg_loss: 0.1394, reg_loss: 0.1385 ||:  92%|#########1| 102/111 [01:10<00:06,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9288, LAS: 0.8719, UEM: 0.5261, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6212, partial_loss/deprel_loss: 0.7073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8296, loss: 0.8832, batch_reg_loss: 0.1395, reg_loss: 0.1385 ||:  95%|#########5| 106/111 [01:13<00:03,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8191, UAS: 0.9283, LAS: 0.8714, UEM: 0.5235, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4445, partial_loss/deprel_loss: 1.0017, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2298, loss: 0.8870, batch_reg_loss: 0.1396, reg_loss: 0.1386 ||:  99%|#########9| 110/111 [01:16<00:00,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9286, LAS: 0.8717, UEM: 0.5255, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2913, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5934, loss: 0.8844, batch_reg_loss: 0.1396, reg_loss: 0.1386 ||: 100%|##########| 111/111 [01:17<00:00,  1.44it/s]\n",
      "2023-04-06 23:43:37,470 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9208, LAS: 0.8625, UEM: 0.4979, LEM: 0.1992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3803, partial_loss/deprel_loss: 25.0669, partial_loss/cycle_loss: 0.0000, batch_loss: 20.1296, loss: 34.6105, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.03s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9200, LAS: 0.8624, UEM: 0.3798, LEM: 0.1298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2659, partial_loss/deprel_loss: 50.9556, partial_loss/cycle_loss: 0.0000, batch_loss: 41.0176, loss: 35.2960, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  31%|###       | 4/13 [00:04<00:09,  1.03s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9319, LAS: 0.8754, UEM: 0.4854, LEM: 0.2095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5658, partial_loss/deprel_loss: 25.1574, partial_loss/cycle_loss: 0.0000, batch_loss: 20.2391, loss: 30.3282, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:06<00:05,  1.00it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9064, UAS: 0.9407, LAS: 0.8855, UEM: 0.6077, LEM: 0.3154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3743, partial_loss/deprel_loss: 26.9548, partial_loss/cycle_loss: 0.0000, batch_loss: 21.6387, loss: 28.1431, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:04,  1.01s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9435, LAS: 0.8899, UEM: 0.6518, LEM: 0.3867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7037, partial_loss/deprel_loss: 31.0434, partial_loss/cycle_loss: 0.0000, batch_loss: 24.9755, loss: 26.9689, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9423, LAS: 0.8885, UEM: 0.6328, LEM: 0.3709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9222, partial_loss/deprel_loss: 32.1733, partial_loss/cycle_loss: 0.0000, batch_loss: 25.9231, loss: 26.8884, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.05it/s]\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.494  |    32.173\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.291  |     0.922\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.139  |     0.000\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - UEM                      |     0.525  |     0.633\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - LAS                      |     0.872  |     0.888\n",
      "2023-04-06 23:43:49,821 - INFO - combo.training.tensorboard_writer - loss                     |     0.884  |    26.888\n",
      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - LEM                      |     0.294  |     0.371\n",
      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |     0.942\n",
      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - EM                       |     0.911  |     0.871\n",
      "2023-04-06 23:43:49,822 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:43:49,822 - INFO - combo.training.trainer - Epoch duration: 0:01:29.437908\n",
      "2023-04-06 23:43:49,823 - INFO - combo.training.trainer - Estimated training time remaining: 7:53:11\n",
      "2023-04-06 23:43:49,823 - INFO - allennlp.training.trainer - Epoch 41/399\n",
      "2023-04-06 23:43:49,823 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:43:49,823 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:43:49,829 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9473, LAS: 0.8922, UEM: 0.5747, LEM: 0.2760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7457, partial_loss/deprel_loss: 0.8736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9877, loss: 0.7340, batch_reg_loss: 0.1397, reg_loss: 0.1396 ||:   4%|3         | 4/111 [00:02<01:06,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8831, UAS: 0.9386, LAS: 0.8829, UEM: 0.5009, LEM: 0.2195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5661, partial_loss/deprel_loss: 0.6803, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7971, loss: 0.8012, batch_reg_loss: 0.1397, reg_loss: 0.1397 ||:   6%|6         | 7/111 [00:04<01:06,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9384, LAS: 0.8814, UEM: 0.4792, LEM: 0.2018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3911, partial_loss/deprel_loss: 0.5334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6447, loss: 0.8055, batch_reg_loss: 0.1398, reg_loss: 0.1397 ||:  10%|9         | 11/111 [00:07<01:05,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9380, LAS: 0.8812, UEM: 0.4718, LEM: 0.1999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6246, partial_loss/deprel_loss: 0.7587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8718, loss: 0.8062, batch_reg_loss: 0.1399, reg_loss: 0.1397 ||:  14%|#3        | 15/111 [00:09<01:01,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9369, LAS: 0.8806, UEM: 0.4850, LEM: 0.2139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4880, partial_loss/deprel_loss: 0.5864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7066, loss: 0.8159, batch_reg_loss: 0.1399, reg_loss: 0.1398 ||:  16%|#6        | 18/111 [00:12<01:03,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9404, LAS: 0.8844, UEM: 0.5462, LEM: 0.2671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2989, partial_loss/deprel_loss: 0.4637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5707, loss: 0.7806, batch_reg_loss: 0.1400, reg_loss: 0.1398 ||:  19%|#8        | 21/111 [00:14<01:02,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9405, LAS: 0.8848, UEM: 0.5380, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7704, partial_loss/deprel_loss: 0.7739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9132, loss: 0.7765, batch_reg_loss: 0.1400, reg_loss: 0.1398 ||:  22%|##1       | 24/111 [00:16<01:03,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9381, LAS: 0.8821, UEM: 0.5425, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4807, partial_loss/deprel_loss: 0.6797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.7943, batch_reg_loss: 0.1401, reg_loss: 0.1398 ||:  24%|##4       | 27/111 [00:18<01:00,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8412, UAS: 0.9360, LAS: 0.8798, UEM: 0.5291, LEM: 0.2597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2766, partial_loss/deprel_loss: 0.8635, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0862, loss: 0.8113, batch_reg_loss: 0.1401, reg_loss: 0.1399 ||:  27%|##7       | 30/111 [00:20<00:56,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8469, UAS: 0.9353, LAS: 0.8792, UEM: 0.5505, LEM: 0.2951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0839, partial_loss/deprel_loss: 0.9513, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1179, loss: 0.8167, batch_reg_loss: 0.1401, reg_loss: 0.1399 ||:  30%|##9       | 33/111 [00:22<00:55,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9379, LAS: 0.8819, UEM: 0.5853, LEM: 0.3245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1621, partial_loss/deprel_loss: 0.4345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.7952, batch_reg_loss: 0.1402, reg_loss: 0.1399 ||:  32%|###2      | 36/111 [00:25<00:54,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9373, LAS: 0.8810, UEM: 0.5804, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5903, partial_loss/deprel_loss: 0.6910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8111, loss: 0.8015, batch_reg_loss: 0.1403, reg_loss: 0.1399 ||:  36%|###6      | 40/111 [00:27<00:50,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9365, LAS: 0.8805, UEM: 0.5882, LEM: 0.3335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1602, partial_loss/deprel_loss: 0.3119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4219, loss: 0.8045, batch_reg_loss: 0.1403, reg_loss: 0.1400 ||:  39%|###8      | 43/111 [00:29<00:48,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8546, UAS: 0.9357, LAS: 0.8799, UEM: 0.5839, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0559, partial_loss/deprel_loss: 0.8560, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0364, loss: 0.8087, batch_reg_loss: 0.1404, reg_loss: 0.1400 ||:  41%|####1     | 46/111 [00:32<00:45,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9341, LAS: 0.8782, UEM: 0.5697, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4055, partial_loss/deprel_loss: 0.4768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6030, loss: 0.8229, batch_reg_loss: 0.1404, reg_loss: 0.1400 ||:  45%|####5     | 50/111 [00:34<00:41,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8459, UAS: 0.9332, LAS: 0.8772, UEM: 0.5581, LEM: 0.3137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9401, partial_loss/deprel_loss: 0.8900, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0405, loss: 0.8303, batch_reg_loss: 0.1405, reg_loss: 0.1401 ||:  48%|####7     | 53/111 [00:36<00:39,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9313, LAS: 0.8754, UEM: 0.5553, LEM: 0.3113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7602, partial_loss/deprel_loss: 0.7644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9042, loss: 0.8451, batch_reg_loss: 0.1406, reg_loss: 0.1401 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9299, LAS: 0.8736, UEM: 0.5401, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6608, partial_loss/deprel_loss: 0.7292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8562, loss: 0.8595, batch_reg_loss: 0.1406, reg_loss: 0.1401 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8242, UAS: 0.9297, LAS: 0.8732, UEM: 0.5341, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2914, partial_loss/deprel_loss: 0.9993, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1984, loss: 0.8635, batch_reg_loss: 0.1407, reg_loss: 0.1401 ||:  57%|#####6    | 63/111 [00:43<00:33,  1.43it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9030, UAS: 0.9302, LAS: 0.8736, UEM: 0.5320, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3977, partial_loss/deprel_loss: 0.5494, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6598, loss: 0.8592, batch_reg_loss: 0.1408, reg_loss: 0.1402 ||:  59%|#####9    | 66/111 [00:45<00:31,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8815, UAS: 0.9306, LAS: 0.8740, UEM: 0.5362, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5458, partial_loss/deprel_loss: 0.6075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7360, loss: 0.8557, batch_reg_loss: 0.1408, reg_loss: 0.1402 ||:  63%|######3   | 70/111 [00:48<00:28,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9305, LAS: 0.8737, UEM: 0.5287, LEM: 0.2884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3618, partial_loss/deprel_loss: 0.5886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6841, loss: 0.8577, batch_reg_loss: 0.1409, reg_loss: 0.1402 ||:  67%|######6   | 74/111 [00:50<00:24,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8691, UAS: 0.9301, LAS: 0.8732, UEM: 0.5233, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6254, partial_loss/deprel_loss: 0.8169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9195, loss: 0.8652, batch_reg_loss: 0.1410, reg_loss: 0.1403 ||:  70%|#######   | 78/111 [00:53<00:21,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8655, UAS: 0.9296, LAS: 0.8724, UEM: 0.5124, LEM: 0.2764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8604, partial_loss/deprel_loss: 0.7997, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9529, loss: 0.8711, batch_reg_loss: 0.1411, reg_loss: 0.1403 ||:  74%|#######3  | 82/111 [00:56<00:19,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8117, UAS: 0.9287, LAS: 0.8713, UEM: 0.5086, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6232, partial_loss/deprel_loss: 1.1753, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4060, loss: 0.8803, batch_reg_loss: 0.1411, reg_loss: 0.1404 ||:  77%|#######7  | 86/111 [00:58<00:16,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8470, UAS: 0.9289, LAS: 0.8716, UEM: 0.5090, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9237, partial_loss/deprel_loss: 0.8957, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0425, loss: 0.8771, batch_reg_loss: 0.1412, reg_loss: 0.1404 ||:  81%|########1 | 90/111 [01:01<00:14,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8360, UAS: 0.9291, LAS: 0.8718, UEM: 0.5114, LEM: 0.2740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2032, partial_loss/deprel_loss: 1.0468, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2193, loss: 0.8760, batch_reg_loss: 0.1413, reg_loss: 0.1404 ||:  84%|########3 | 93/111 [01:05<00:15,  1.13it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9303, LAS: 0.8733, UEM: 0.5341, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0761, partial_loss/deprel_loss: 0.1753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2968, loss: 0.8647, batch_reg_loss: 0.1413, reg_loss: 0.1404 ||:  86%|########6 | 96/111 [01:08<00:12,  1.17it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8879, UAS: 0.9304, LAS: 0.8733, UEM: 0.5303, LEM: 0.2949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4572, partial_loss/deprel_loss: 0.5740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6921, loss: 0.8644, batch_reg_loss: 0.1414, reg_loss: 0.1405 ||:  90%|######### | 100/111 [01:10<00:08,  1.25it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7828, UAS: 0.9302, LAS: 0.8732, UEM: 0.5366, LEM: 0.3012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0178, partial_loss/deprel_loss: 1.2750, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5650, loss: 0.8644, batch_reg_loss: 0.1415, reg_loss: 0.1405 ||:  93%|#########2| 103/111 [01:12<00:06,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8301, UAS: 0.9297, LAS: 0.8725, UEM: 0.5303, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2271, partial_loss/deprel_loss: 0.9879, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1772, loss: 0.8693, batch_reg_loss: 0.1415, reg_loss: 0.1405 ||:  96%|#########6| 107/111 [01:15<00:02,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9286, LAS: 0.8714, UEM: 0.5247, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5258, partial_loss/deprel_loss: 1.1332, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3533, loss: 0.8775, batch_reg_loss: 0.1416, reg_loss: 0.1406 ||: 100%|##########| 111/111 [01:17<00:00,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8079, UAS: 0.9286, LAS: 0.8714, UEM: 0.5247, LEM: 0.2920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5258, partial_loss/deprel_loss: 1.1332, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3533, loss: 0.8775, batch_reg_loss: 0.1416, reg_loss: 0.1406 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:45:07,632 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.133  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.526  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.141  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - UEM                      |     0.525  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - LAS                      |     0.871  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - loss                     |     0.877  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - LEM                      |     0.292  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - EM                       |     0.808  |       N/A\n",
      "2023-04-06 23:45:07,633 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:45:07,634 - INFO - combo.training.trainer - Epoch duration: 0:01:17.811230\n",
      "2023-04-06 23:45:07,634 - INFO - combo.training.trainer - Estimated training time remaining: 7:51:41\n",
      "2023-04-06 23:45:07,634 - INFO - allennlp.training.trainer - Epoch 42/399\n",
      "2023-04-06 23:45:07,634 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:45:07,635 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:45:07,641 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9418, LAS: 0.8844, UEM: 0.6837, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1491, partial_loss/deprel_loss: 0.3171, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4252, loss: 0.7424, batch_reg_loss: 0.1416, reg_loss: 0.1416 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9439, LAS: 0.8897, UEM: 0.6355, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3734, partial_loss/deprel_loss: 0.5091, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6237, loss: 0.7500, batch_reg_loss: 0.1417, reg_loss: 0.1416 ||:   6%|6         | 7/111 [00:04<01:12,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8109, UAS: 0.9345, LAS: 0.8808, UEM: 0.5993, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8176, partial_loss/deprel_loss: 1.0696, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3609, loss: 0.8223, batch_reg_loss: 0.1418, reg_loss: 0.1417 ||:   9%|9         | 10/111 [00:06<01:10,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9321, LAS: 0.8780, UEM: 0.5473, LEM: 0.3023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9754, partial_loss/deprel_loss: 0.9375, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0869, loss: 0.8430, batch_reg_loss: 0.1418, reg_loss: 0.1417 ||:  12%|#1        | 13/111 [00:09<01:11,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9290, LAS: 0.8745, UEM: 0.5006, LEM: 0.2696, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9098, partial_loss/deprel_loss: 0.8706, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0203, loss: 0.8699, batch_reg_loss: 0.1419, reg_loss: 0.1417 ||:  14%|#4        | 16/111 [00:11<01:08,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7885, UAS: 0.9225, LAS: 0.8667, UEM: 0.4693, LEM: 0.2489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9202, partial_loss/deprel_loss: 1.2812, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5509, loss: 0.9321, batch_reg_loss: 0.1419, reg_loss: 0.1418 ||:  17%|#7        | 19/111 [00:13<01:06,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9252, LAS: 0.8689, UEM: 0.4885, LEM: 0.2640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2645, partial_loss/deprel_loss: 0.3956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5114, loss: 0.9091, batch_reg_loss: 0.1420, reg_loss: 0.1418 ||:  20%|#9        | 22/111 [00:15<01:04,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7888, UAS: 0.9224, LAS: 0.8653, UEM: 0.4605, LEM: 0.2419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7105, partial_loss/deprel_loss: 1.1578, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4104, loss: 0.9309, batch_reg_loss: 0.1421, reg_loss: 0.1418 ||:  23%|##3       | 26/111 [00:18<00:57,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9242, LAS: 0.8673, UEM: 0.4631, LEM: 0.2382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6195, partial_loss/deprel_loss: 0.7172, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8398, loss: 0.9185, batch_reg_loss: 0.1421, reg_loss: 0.1419 ||:  27%|##7       | 30/111 [00:20<00:54,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9257, LAS: 0.8693, UEM: 0.4708, LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4584, partial_loss/deprel_loss: 0.5306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6584, loss: 0.9047, batch_reg_loss: 0.1422, reg_loss: 0.1419 ||:  31%|###       | 34/111 [00:22<00:49,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8119, UAS: 0.9266, LAS: 0.8708, UEM: 0.5190, LEM: 0.2948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5656, partial_loss/deprel_loss: 1.1580, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3818, loss: 0.8919, batch_reg_loss: 0.1423, reg_loss: 0.1419 ||:  34%|###4      | 38/111 [00:25<00:47,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8013, UAS: 0.9268, LAS: 0.8702, UEM: 0.5255, LEM: 0.2939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6049, partial_loss/deprel_loss: 1.2007, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4239, loss: 0.8945, batch_reg_loss: 0.1424, reg_loss: 0.1420 ||:  38%|###7      | 42/111 [00:28<00:44,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9244, LAS: 0.8681, UEM: 0.5113, LEM: 0.2843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5069, partial_loss/deprel_loss: 0.5866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7131, loss: 0.9143, batch_reg_loss: 0.1425, reg_loss: 0.1420 ||:  41%|####1     | 46/111 [00:30<00:42,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9260, LAS: 0.8699, UEM: 0.5146, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9033, partial_loss/deprel_loss: 0.9612, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0922, loss: 0.9012, batch_reg_loss: 0.1425, reg_loss: 0.1421 ||:  45%|####5     | 50/111 [00:33<00:41,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9262, LAS: 0.8700, UEM: 0.5082, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3898, partial_loss/deprel_loss: 0.5459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6573, loss: 0.8964, batch_reg_loss: 0.1426, reg_loss: 0.1421 ||:  48%|####7     | 53/111 [00:35<00:39,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9264, LAS: 0.8700, UEM: 0.5088, LEM: 0.2775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2628, partial_loss/deprel_loss: 0.4712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5722, loss: 0.8967, batch_reg_loss: 0.1427, reg_loss: 0.1421 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8572, UAS: 0.9269, LAS: 0.8703, UEM: 0.5012, LEM: 0.2697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8432, partial_loss/deprel_loss: 0.8230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9697, loss: 0.8934, batch_reg_loss: 0.1427, reg_loss: 0.1422 ||:  54%|#####4    | 60/111 [00:40<00:33,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9261, LAS: 0.8694, UEM: 0.4960, LEM: 0.2659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4341, partial_loss/deprel_loss: 0.5681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6841, loss: 0.9014, batch_reg_loss: 0.1428, reg_loss: 0.1422 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9270, LAS: 0.8702, UEM: 0.5018, LEM: 0.2708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4418, partial_loss/deprel_loss: 0.5853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6995, loss: 0.8965, batch_reg_loss: 0.1429, reg_loss: 0.1422 ||:  61%|######1   | 68/111 [00:45<00:29,  1.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9281, LAS: 0.8715, UEM: 0.5132, LEM: 0.2776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3822, partial_loss/deprel_loss: 0.5883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6900, loss: 0.8848, batch_reg_loss: 0.1429, reg_loss: 0.1423 ||:  64%|######3   | 71/111 [00:47<00:27,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9280, LAS: 0.8712, UEM: 0.5081, LEM: 0.2720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6994, partial_loss/deprel_loss: 0.7017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8442, loss: 0.8869, batch_reg_loss: 0.1430, reg_loss: 0.1423 ||:  68%|######7   | 75/111 [00:50<00:23,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8278, UAS: 0.9281, LAS: 0.8714, UEM: 0.5251, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4009, partial_loss/deprel_loss: 1.1302, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3274, loss: 0.8879, batch_reg_loss: 0.1431, reg_loss: 0.1423 ||:  71%|#######1  | 79/111 [00:53<00:21,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8092, UAS: 0.9276, LAS: 0.8707, UEM: 0.5240, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5534, partial_loss/deprel_loss: 1.0782, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3164, loss: 0.8904, batch_reg_loss: 0.1432, reg_loss: 0.1424 ||:  75%|#######4  | 83/111 [00:55<00:18,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9264, LAS: 0.8695, UEM: 0.5132, LEM: 0.2898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8338, partial_loss/deprel_loss: 0.8070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9556, loss: 0.9018, batch_reg_loss: 0.1432, reg_loss: 0.1424 ||:  78%|#######8  | 87/111 [00:58<00:15,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9264, LAS: 0.8696, UEM: 0.5124, LEM: 0.2889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.4932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5954, loss: 0.9021, batch_reg_loss: 0.1433, reg_loss: 0.1425 ||:  82%|########1 | 91/111 [01:00<00:12,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9273, LAS: 0.8706, UEM: 0.5229, LEM: 0.2959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3174, partial_loss/deprel_loss: 0.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5409, loss: 0.8934, batch_reg_loss: 0.1434, reg_loss: 0.1425 ||:  86%|########5 | 95/111 [01:04<00:11,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9280, LAS: 0.8714, UEM: 0.5268, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5531, partial_loss/deprel_loss: 0.6957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8106, loss: 0.8872, batch_reg_loss: 0.1434, reg_loss: 0.1425 ||:  88%|########8 | 98/111 [01:06<00:09,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8226, UAS: 0.9276, LAS: 0.8709, UEM: 0.5227, LEM: 0.2933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2476, partial_loss/deprel_loss: 1.0486, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2319, loss: 0.8905, batch_reg_loss: 0.1435, reg_loss: 0.1425 ||:  91%|######### | 101/111 [01:08<00:07,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8271, UAS: 0.9276, LAS: 0.8708, UEM: 0.5191, LEM: 0.2894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2091, partial_loss/deprel_loss: 0.9989, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1845, loss: 0.8903, batch_reg_loss: 0.1435, reg_loss: 0.1426 ||:  94%|#########3| 104/111 [01:10<00:04,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9281, LAS: 0.8713, UEM: 0.5172, LEM: 0.2862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3627, partial_loss/deprel_loss: 0.5546, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.8854, batch_reg_loss: 0.1436, reg_loss: 0.1426 ||:  97%|#########7| 108/111 [01:12<00:02,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9289, LAS: 0.8721, UEM: 0.5273, LEM: 0.2946, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1537, partial_loss/deprel_loss: 0.3458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4510, loss: 0.8789, batch_reg_loss: 0.1437, reg_loss: 0.1426 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-06 23:46:23,087 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.346  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.154  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.143  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - UEM                      |     0.527  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - LAS                      |     0.872  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - loss                     |     0.879  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:46:23,088 - INFO - combo.training.tensorboard_writer - LEM                      |     0.295  |       N/A\n",
      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - EM                       |     0.923  |       N/A\n",
      "2023-04-06 23:46:23,089 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:46:23,089 - INFO - combo.training.trainer - Epoch duration: 0:01:15.455331\n",
      "2023-04-06 23:46:23,090 - INFO - combo.training.trainer - Estimated training time remaining: 7:49:52\n",
      "2023-04-06 23:46:23,090 - INFO - allennlp.training.trainer - Epoch 43/399\n",
      "2023-04-06 23:46:23,090 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:46:23,090 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:46:23,096 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9428, LAS: 0.8899, UEM: 0.5301, LEM: 0.2811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7088, partial_loss/deprel_loss: 0.7559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8902, loss: 0.7165, batch_reg_loss: 0.1437, reg_loss: 0.1437 ||:   4%|3         | 4/111 [00:02<01:12,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9305, LAS: 0.8755, UEM: 0.4153, LEM: 0.2112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9663, partial_loss/deprel_loss: 0.8616, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0263, loss: 0.8579, batch_reg_loss: 0.1438, reg_loss: 0.1437 ||:   6%|6         | 7/111 [00:04<01:12,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9267, LAS: 0.8695, UEM: 0.3652, LEM: 0.1685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4697, partial_loss/deprel_loss: 0.6609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7665, loss: 0.8932, batch_reg_loss: 0.1438, reg_loss: 0.1438 ||:  10%|9         | 11/111 [00:07<01:07,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9308, LAS: 0.8744, UEM: 0.4503, LEM: 0.2264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2776, partial_loss/deprel_loss: 0.3887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5104, loss: 0.8467, batch_reg_loss: 0.1439, reg_loss: 0.1438 ||:  13%|#2        | 14/111 [00:09<01:07,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9310, LAS: 0.8749, UEM: 0.4808, LEM: 0.2451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4315, partial_loss/deprel_loss: 0.5662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6832, loss: 0.8372, batch_reg_loss: 0.1439, reg_loss: 0.1438 ||:  15%|#5        | 17/111 [00:11<01:07,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9305, LAS: 0.8744, UEM: 0.4984, LEM: 0.2527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2001, partial_loss/deprel_loss: 0.4246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5237, loss: 0.8381, batch_reg_loss: 0.1440, reg_loss: 0.1438 ||:  18%|#8        | 20/111 [00:14<01:04,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9311, LAS: 0.8754, UEM: 0.4955, LEM: 0.2494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4113, partial_loss/deprel_loss: 0.5384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6570, loss: 0.8374, batch_reg_loss: 0.1440, reg_loss: 0.1438 ||:  21%|##        | 23/111 [00:16<01:02,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9299, LAS: 0.8747, UEM: 0.5014, LEM: 0.2621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0566, partial_loss/deprel_loss: 0.9292, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0988, loss: 0.8457, batch_reg_loss: 0.1441, reg_loss: 0.1439 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9280, LAS: 0.8729, UEM: 0.4755, LEM: 0.2457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7893, partial_loss/deprel_loss: 0.7554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9063, loss: 0.8606, batch_reg_loss: 0.1441, reg_loss: 0.1439 ||:  27%|##7       | 30/111 [00:20<00:53,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9309, LAS: 0.8757, UEM: 0.4968, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.7238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8175, loss: 0.8412, batch_reg_loss: 0.1442, reg_loss: 0.1439 ||:  31%|###       | 34/111 [00:23<00:50,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9296, LAS: 0.8741, UEM: 0.4825, LEM: 0.2462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4805, partial_loss/deprel_loss: 0.6438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7554, loss: 0.8578, batch_reg_loss: 0.1443, reg_loss: 0.1440 ||:  33%|###3      | 37/111 [00:25<00:49,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9576, UAS: 0.9296, LAS: 0.8747, UEM: 0.5280, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0719, partial_loss/deprel_loss: 0.1706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2952, loss: 0.8560, batch_reg_loss: 0.1443, reg_loss: 0.1440 ||:  36%|###6      | 40/111 [00:27<00:49,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8147, UAS: 0.9272, LAS: 0.8719, UEM: 0.5142, LEM: 0.2989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4103, partial_loss/deprel_loss: 1.0491, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2657, loss: 0.8769, batch_reg_loss: 0.1444, reg_loss: 0.1440 ||:  39%|###8      | 43/111 [00:29<00:46,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8604, UAS: 0.9253, LAS: 0.8700, UEM: 0.5011, LEM: 0.2891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8102, partial_loss/deprel_loss: 0.8194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9620, loss: 0.8908, batch_reg_loss: 0.1444, reg_loss: 0.1440 ||:  41%|####1     | 46/111 [00:31<00:46,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9264, LAS: 0.8710, UEM: 0.5009, LEM: 0.2851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3478, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6148, loss: 0.8833, batch_reg_loss: 0.1445, reg_loss: 0.1441 ||:  44%|####4     | 49/111 [00:33<00:43,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9273, LAS: 0.8721, UEM: 0.5077, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4123, partial_loss/deprel_loss: 0.5633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6777, loss: 0.8738, batch_reg_loss: 0.1446, reg_loss: 0.1441 ||:  48%|####7     | 53/111 [00:36<00:39,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9277, LAS: 0.8724, UEM: 0.5111, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2746, partial_loss/deprel_loss: 0.5166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6128, loss: 0.8723, batch_reg_loss: 0.1446, reg_loss: 0.1441 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9271, LAS: 0.8720, UEM: 0.5031, LEM: 0.2829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3995, partial_loss/deprel_loss: 0.4965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6218, loss: 0.8758, batch_reg_loss: 0.1447, reg_loss: 0.1442 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9282, LAS: 0.8732, UEM: 0.5039, LEM: 0.2799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4876, partial_loss/deprel_loss: 0.6137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7333, loss: 0.8675, batch_reg_loss: 0.1448, reg_loss: 0.1442 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9280, LAS: 0.8729, UEM: 0.5005, LEM: 0.2765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7839, partial_loss/deprel_loss: 0.7660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9144, loss: 0.8710, batch_reg_loss: 0.1449, reg_loss: 0.1442 ||:  61%|######1   | 68/111 [00:46<00:27,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9287, LAS: 0.8736, UEM: 0.4970, LEM: 0.2705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4859, partial_loss/deprel_loss: 0.6183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7367, loss: 0.8662, batch_reg_loss: 0.1449, reg_loss: 0.1443 ||:  65%|######4   | 72/111 [00:48<00:23,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8157, UAS: 0.9272, LAS: 0.8720, UEM: 0.4943, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5636, partial_loss/deprel_loss: 1.0879, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3280, loss: 0.8815, batch_reg_loss: 0.1450, reg_loss: 0.1443 ||:  68%|######8   | 76/111 [00:50<00:21,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8144, UAS: 0.9269, LAS: 0.8717, UEM: 0.5034, LEM: 0.2805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5043, partial_loss/deprel_loss: 1.1348, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3537, loss: 0.8843, batch_reg_loss: 0.1450, reg_loss: 0.1443 ||:  72%|#######2  | 80/111 [00:53<00:18,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8524, UAS: 0.9266, LAS: 0.8709, UEM: 0.4931, LEM: 0.2729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7594, partial_loss/deprel_loss: 0.8771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9986, loss: 0.8908, batch_reg_loss: 0.1451, reg_loss: 0.1444 ||:  76%|#######5  | 84/111 [00:55<00:16,  1.68it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9272, LAS: 0.8716, UEM: 0.5056, LEM: 0.2823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3730, partial_loss/deprel_loss: 0.5287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6428, loss: 0.8835, batch_reg_loss: 0.1452, reg_loss: 0.1444 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9283, LAS: 0.8730, UEM: 0.5235, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1638, partial_loss/deprel_loss: 0.2994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4175, loss: 0.8710, batch_reg_loss: 0.1453, reg_loss: 0.1445 ||:  83%|########2 | 92/111 [01:01<00:13,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9284, LAS: 0.8731, UEM: 0.5205, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4851, partial_loss/deprel_loss: 0.6839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7895, loss: 0.8712, batch_reg_loss: 0.1453, reg_loss: 0.1445 ||:  86%|########6 | 96/111 [01:04<00:09,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8395, UAS: 0.9279, LAS: 0.8724, UEM: 0.5209, LEM: 0.2968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1321, partial_loss/deprel_loss: 1.0463, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2089, loss: 0.8762, batch_reg_loss: 0.1454, reg_loss: 0.1445 ||:  90%|######### | 100/111 [01:06<00:07,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8728, UAS: 0.9277, LAS: 0.8722, UEM: 0.5211, LEM: 0.2954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6545, partial_loss/deprel_loss: 0.6932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8310, loss: 0.8775, batch_reg_loss: 0.1455, reg_loss: 0.1446 ||:  94%|#########3| 104/111 [01:09<00:04,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8994, UAS: 0.9282, LAS: 0.8725, UEM: 0.5207, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3772, partial_loss/deprel_loss: 0.5600, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6690, loss: 0.8751, batch_reg_loss: 0.1455, reg_loss: 0.1446 ||:  97%|#########7| 108/111 [01:11<00:01,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7823, UAS: 0.9278, LAS: 0.8719, UEM: 0.5203, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0270, partial_loss/deprel_loss: 1.3010, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5918, loss: 0.8791, batch_reg_loss: 0.1456, reg_loss: 0.1446 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:47:37,185 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.301  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     2.027  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.145  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - UEM                      |     0.520  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - LAS                      |     0.872  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - loss                     |     0.879  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - LEM                      |     0.292  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - UAS                      |     0.928  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - EM                       |     0.782  |       N/A\n",
      "2023-04-06 23:47:37,186 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:47:37,187 - INFO - combo.training.trainer - Epoch duration: 0:01:14.097322\n",
      "2023-04-06 23:47:37,187 - INFO - combo.training.trainer - Estimated training time remaining: 7:47:54\n",
      "2023-04-06 23:47:37,187 - INFO - allennlp.training.trainer - Epoch 44/399\n",
      "2023-04-06 23:47:37,187 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:47:37,188 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:47:37,194 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9630, LAS: 0.9171, UEM: 0.7763, LEM: 0.5258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3786, partial_loss/deprel_loss: 0.5238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6404, loss: 0.5429, batch_reg_loss: 0.1456, reg_loss: 0.1456 ||:   3%|2         | 3/111 [00:02<01:23,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9468, LAS: 0.8951, UEM: 0.6389, LEM: 0.3900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5384, partial_loss/deprel_loss: 0.6080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7398, loss: 0.7117, batch_reg_loss: 0.1457, reg_loss: 0.1456 ||:   6%|6         | 7/111 [00:04<01:16,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9520, LAS: 0.9005, UEM: 0.6665, LEM: 0.3958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4527, partial_loss/deprel_loss: 0.5690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6915, loss: 0.6676, batch_reg_loss: 0.1458, reg_loss: 0.1457 ||:  10%|9         | 11/111 [00:07<01:09,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7963, UAS: 0.9398, LAS: 0.8874, UEM: 0.6268, LEM: 0.3682, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8417, partial_loss/deprel_loss: 1.2189, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4893, loss: 0.7801, batch_reg_loss: 0.1458, reg_loss: 0.1457 ||:  13%|#2        | 14/111 [00:09<01:07,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8781, UAS: 0.9389, LAS: 0.8862, UEM: 0.6093, LEM: 0.3491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6420, partial_loss/deprel_loss: 0.6886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8252, loss: 0.7783, batch_reg_loss: 0.1458, reg_loss: 0.1457 ||:  15%|#5        | 17/111 [00:11<01:06,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8938, UAS: 0.9394, LAS: 0.8866, UEM: 0.6067, LEM: 0.3482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4438, partial_loss/deprel_loss: 0.6601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7627, loss: 0.7781, batch_reg_loss: 0.1459, reg_loss: 0.1457 ||:  18%|#8        | 20/111 [00:13<01:04,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8509, UAS: 0.9330, LAS: 0.8786, UEM: 0.5653, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9093, partial_loss/deprel_loss: 0.8832, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0344, loss: 0.8428, batch_reg_loss: 0.1460, reg_loss: 0.1458 ||:  22%|##1       | 24/111 [00:16<00:59,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7874, UAS: 0.9295, LAS: 0.8749, UEM: 0.5659, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0483, partial_loss/deprel_loss: 1.1934, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5104, loss: 0.8740, batch_reg_loss: 0.1460, reg_loss: 0.1458 ||:  25%|##5       | 28/111 [00:18<00:56,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8710, UAS: 0.9314, LAS: 0.8773, UEM: 0.5799, LEM: 0.3389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6995, partial_loss/deprel_loss: 0.7559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8907, loss: 0.8550, batch_reg_loss: 0.1461, reg_loss: 0.1458 ||:  28%|##7       | 31/111 [00:21<00:55,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9303, LAS: 0.8762, UEM: 0.5832, LEM: 0.3393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4871, partial_loss/deprel_loss: 0.5664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6967, loss: 0.8632, batch_reg_loss: 0.1462, reg_loss: 0.1459 ||:  32%|###1      | 35/111 [00:23<00:51,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9297, LAS: 0.8753, UEM: 0.5582, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6452, partial_loss/deprel_loss: 0.7188, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8503, loss: 0.8698, batch_reg_loss: 0.1462, reg_loss: 0.1459 ||:  35%|###5      | 39/111 [00:26<00:48,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8624, UAS: 0.9305, LAS: 0.8756, UEM: 0.5537, LEM: 0.3114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7213, partial_loss/deprel_loss: 0.7833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9172, loss: 0.8642, batch_reg_loss: 0.1463, reg_loss: 0.1459 ||:  38%|###7      | 42/111 [00:28<00:47,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9290, LAS: 0.8735, UEM: 0.5410, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0237, partial_loss/deprel_loss: 0.8837, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0581, loss: 0.8770, batch_reg_loss: 0.1464, reg_loss: 0.1460 ||:  41%|####1     | 46/111 [00:30<00:43,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9317, LAS: 0.8768, UEM: 0.5692, LEM: 0.3247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3221, partial_loss/deprel_loss: 0.5263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6319, loss: 0.8508, batch_reg_loss: 0.1465, reg_loss: 0.1460 ||:  45%|####5     | 50/111 [00:33<00:40,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9321, LAS: 0.8772, UEM: 0.5601, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5211, partial_loss/deprel_loss: 0.6311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7556, loss: 0.8474, batch_reg_loss: 0.1465, reg_loss: 0.1460 ||:  49%|####8     | 54/111 [00:36<00:37,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9311, LAS: 0.8759, UEM: 0.5516, LEM: 0.3082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5666, partial_loss/deprel_loss: 0.6358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7685, loss: 0.8563, batch_reg_loss: 0.1466, reg_loss: 0.1461 ||:  52%|#####2    | 58/111 [00:38<00:35,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8161, UAS: 0.9310, LAS: 0.8758, UEM: 0.5487, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4201, partial_loss/deprel_loss: 1.0710, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2874, loss: 0.8568, batch_reg_loss: 0.1466, reg_loss: 0.1461 ||:  56%|#####5    | 62/111 [00:41<00:34,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9310, LAS: 0.8756, UEM: 0.5411, LEM: 0.2988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6316, partial_loss/deprel_loss: 0.7124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8429, loss: 0.8575, batch_reg_loss: 0.1467, reg_loss: 0.1461 ||:  59%|#####8    | 65/111 [00:43<00:32,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9304, LAS: 0.8748, UEM: 0.5300, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8484, partial_loss/deprel_loss: 0.8227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9745, loss: 0.8617, batch_reg_loss: 0.1467, reg_loss: 0.1462 ||:  61%|######1   | 68/111 [00:46<00:29,  1.44it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9297, LAS: 0.8742, UEM: 0.5247, LEM: 0.2871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5040, partial_loss/deprel_loss: 0.5522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6894, loss: 0.8663, batch_reg_loss: 0.1468, reg_loss: 0.1462 ||:  65%|######4   | 72/111 [00:48<00:25,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9296, LAS: 0.8740, UEM: 0.5207, LEM: 0.2814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2853, partial_loss/deprel_loss: 0.5267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6253, loss: 0.8694, batch_reg_loss: 0.1469, reg_loss: 0.1462 ||:  68%|######8   | 76/111 [00:51<00:23,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9301, LAS: 0.8746, UEM: 0.5239, LEM: 0.2825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4784, partial_loss/deprel_loss: 0.6309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7473, loss: 0.8649, batch_reg_loss: 0.1470, reg_loss: 0.1463 ||:  72%|#######2  | 80/111 [00:53<00:20,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9295, LAS: 0.8739, UEM: 0.5156, LEM: 0.2772, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8536, partial_loss/deprel_loss: 0.8270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9793, loss: 0.8710, batch_reg_loss: 0.1470, reg_loss: 0.1463 ||:  76%|#######5  | 84/111 [00:56<00:17,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8424, UAS: 0.9279, LAS: 0.8721, UEM: 0.5087, LEM: 0.2720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1010, partial_loss/deprel_loss: 0.9139, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0984, loss: 0.8855, batch_reg_loss: 0.1471, reg_loss: 0.1463 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8623, UAS: 0.9283, LAS: 0.8724, UEM: 0.5060, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7206, partial_loss/deprel_loss: 0.8822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9970, loss: 0.8843, batch_reg_loss: 0.1472, reg_loss: 0.1464 ||:  83%|########2 | 92/111 [01:01<00:11,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9280, LAS: 0.8721, UEM: 0.5019, LEM: 0.2653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9525, partial_loss/deprel_loss: 0.8787, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0407, loss: 0.8880, batch_reg_loss: 0.1473, reg_loss: 0.1464 ||:  86%|########6 | 96/111 [01:03<00:09,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9288, LAS: 0.8728, UEM: 0.5220, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0723, partial_loss/deprel_loss: 0.2095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3294, loss: 0.8826, batch_reg_loss: 0.1473, reg_loss: 0.1464 ||:  90%|######### | 100/111 [01:07<00:07,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8337, UAS: 0.9286, LAS: 0.8726, UEM: 0.5207, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3335, partial_loss/deprel_loss: 1.0984, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2928, loss: 0.8856, batch_reg_loss: 0.1474, reg_loss: 0.1465 ||:  93%|#########2| 103/111 [01:09<00:05,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8814, UAS: 0.9291, LAS: 0.8730, UEM: 0.5236, LEM: 0.2890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4793, partial_loss/deprel_loss: 0.6887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7942, loss: 0.8808, batch_reg_loss: 0.1474, reg_loss: 0.1465 ||:  95%|#########5| 106/111 [01:11<00:03,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9294, LAS: 0.8734, UEM: 0.5320, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1479, partial_loss/deprel_loss: 0.2737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3960, loss: 0.8765, batch_reg_loss: 0.1475, reg_loss: 0.1465 ||:  98%|#########8| 109/111 [01:13<00:01,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8766, UAS: 0.9296, LAS: 0.8735, UEM: 0.5301, LEM: 0.2970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6356, partial_loss/deprel_loss: 0.8034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9174, loss: 0.8758, batch_reg_loss: 0.1475, reg_loss: 0.1465 ||: 100%|##########| 111/111 [01:15<00:00,  1.48it/s]\n",
      "2023-04-06 23:48:52,323 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:48:52,323 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.803  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.636  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.147  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - UEM                      |     0.530  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - LAS                      |     0.873  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - loss                     |     0.876  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:48:52,324 - INFO - combo.training.tensorboard_writer - LEM                      |     0.297  |       N/A\n",
      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - EM                       |     0.877  |       N/A\n",
      "2023-04-06 23:48:52,325 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:48:52,326 - INFO - combo.training.trainer - Epoch duration: 0:01:15.138417\n",
      "2023-04-06 23:48:52,326 - INFO - combo.training.trainer - Estimated training time remaining: 7:46:06\n",
      "2023-04-06 23:48:52,326 - INFO - allennlp.training.trainer - Epoch 45/399\n",
      "2023-04-06 23:48:52,326 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:48:52,326 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:48:52,334 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9169, LAS: 0.8645, UEM: 0.6209, LEM: 0.3762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3488, partial_loss/deprel_loss: 0.4880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6077, loss: 0.9611, batch_reg_loss: 0.1476, reg_loss: 0.1476 ||:   4%|3         | 4/111 [00:02<01:17,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7991, UAS: 0.9205, LAS: 0.8661, UEM: 0.6082, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7394, partial_loss/deprel_loss: 1.2242, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4749, loss: 0.9431, batch_reg_loss: 0.1476, reg_loss: 0.1476 ||:   6%|6         | 7/111 [00:05<01:14,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9206, LAS: 0.8646, UEM: 0.5249, LEM: 0.2889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7115, partial_loss/deprel_loss: 0.7655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9024, loss: 0.9411, batch_reg_loss: 0.1477, reg_loss: 0.1476 ||:  10%|9         | 11/111 [00:07<01:07,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8830, UAS: 0.9248, LAS: 0.8690, UEM: 0.5142, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5019, partial_loss/deprel_loss: 0.7006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8086, loss: 0.8999, batch_reg_loss: 0.1478, reg_loss: 0.1476 ||:  13%|#2        | 14/111 [00:09<01:06,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9275, LAS: 0.8721, UEM: 0.5363, LEM: 0.2925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2829, partial_loss/deprel_loss: 0.3895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.8710, batch_reg_loss: 0.1478, reg_loss: 0.1477 ||:  15%|#5        | 17/111 [00:11<01:06,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8806, UAS: 0.9285, LAS: 0.8730, UEM: 0.5128, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5980, partial_loss/deprel_loss: 0.6489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 0.8690, batch_reg_loss: 0.1479, reg_loss: 0.1477 ||:  18%|#8        | 20/111 [00:13<01:04,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9269, LAS: 0.8713, UEM: 0.4956, LEM: 0.2596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9929, partial_loss/deprel_loss: 0.9136, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0774, loss: 0.8785, batch_reg_loss: 0.1479, reg_loss: 0.1477 ||:  21%|##        | 23/111 [00:15<01:02,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9277, LAS: 0.8720, UEM: 0.4875, LEM: 0.2508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7347, partial_loss/deprel_loss: 0.7592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9022, loss: 0.8687, batch_reg_loss: 0.1480, reg_loss: 0.1478 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9321, LAS: 0.8777, UEM: 0.5737, LEM: 0.3447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3178, partial_loss/deprel_loss: 0.5158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6243, loss: 0.8307, batch_reg_loss: 0.1480, reg_loss: 0.1478 ||:  26%|##6       | 29/111 [00:21<01:05,  1.25it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9321, LAS: 0.8777, UEM: 0.5882, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4529, partial_loss/deprel_loss: 0.5867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7080, loss: 0.8318, batch_reg_loss: 0.1481, reg_loss: 0.1478 ||:  30%|##9       | 33/111 [00:23<00:58,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9305, LAS: 0.8756, UEM: 0.5741, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8034, partial_loss/deprel_loss: 0.8026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9509, loss: 0.8478, batch_reg_loss: 0.1481, reg_loss: 0.1478 ||:  32%|###2      | 36/111 [00:25<00:54,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8671, UAS: 0.9317, LAS: 0.8763, UEM: 0.5771, LEM: 0.3511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6548, partial_loss/deprel_loss: 0.8313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9442, loss: 0.8396, batch_reg_loss: 0.1482, reg_loss: 0.1479 ||:  35%|###5      | 39/111 [00:27<00:52,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9338, LAS: 0.8790, UEM: 0.5864, LEM: 0.3539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3781, partial_loss/deprel_loss: 0.5629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6742, loss: 0.8236, batch_reg_loss: 0.1482, reg_loss: 0.1479 ||:  39%|###8      | 43/111 [00:30<00:47,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9320, LAS: 0.8768, UEM: 0.5703, LEM: 0.3423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1642, partial_loss/deprel_loss: 0.9447, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1368, loss: 0.8393, batch_reg_loss: 0.1483, reg_loss: 0.1479 ||:  41%|####1     | 46/111 [00:32<00:45,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9331, LAS: 0.8779, UEM: 0.5812, LEM: 0.3521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1896, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4418, loss: 0.8277, batch_reg_loss: 0.1483, reg_loss: 0.1479 ||:  44%|####4     | 49/111 [00:34<00:42,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9328, LAS: 0.8772, UEM: 0.5853, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1467, partial_loss/deprel_loss: 0.3971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4954, loss: 0.8332, batch_reg_loss: 0.1484, reg_loss: 0.1480 ||:  47%|####6     | 52/111 [00:36<00:40,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8404, UAS: 0.9322, LAS: 0.8766, UEM: 0.5773, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2362, partial_loss/deprel_loss: 0.9801, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1798, loss: 0.8400, batch_reg_loss: 0.1484, reg_loss: 0.1480 ||:  50%|####9     | 55/111 [00:38<00:39,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9298, LAS: 0.8743, UEM: 0.5684, LEM: 0.3423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3632, partial_loss/deprel_loss: 0.4450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5771, loss: 0.8590, batch_reg_loss: 0.1485, reg_loss: 0.1480 ||:  53%|#####3    | 59/111 [00:41<00:37,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9287, LAS: 0.8731, UEM: 0.5648, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3237, partial_loss/deprel_loss: 0.4315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5585, loss: 0.8692, batch_reg_loss: 0.1485, reg_loss: 0.1480 ||:  56%|#####5    | 62/111 [00:44<00:35,  1.38it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9284, LAS: 0.8725, UEM: 0.5539, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2580, partial_loss/deprel_loss: 1.0314, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2254, loss: 0.8760, batch_reg_loss: 0.1486, reg_loss: 0.1481 ||:  59%|#####9    | 66/111 [00:46<00:31,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8227, UAS: 0.9278, LAS: 0.8719, UEM: 0.5486, LEM: 0.3246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4298, partial_loss/deprel_loss: 0.9430, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1891, loss: 0.8808, batch_reg_loss: 0.1487, reg_loss: 0.1481 ||:  62%|######2   | 69/111 [00:48<00:29,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9270, LAS: 0.8709, UEM: 0.5420, LEM: 0.3179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6441, partial_loss/deprel_loss: 0.6258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7782, loss: 0.8877, batch_reg_loss: 0.1487, reg_loss: 0.1481 ||:  65%|######4   | 72/111 [00:50<00:27,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8926, UAS: 0.9276, LAS: 0.8713, UEM: 0.5411, LEM: 0.3138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4335, partial_loss/deprel_loss: 0.6407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7481, loss: 0.8853, batch_reg_loss: 0.1488, reg_loss: 0.1482 ||:  68%|######8   | 76/111 [00:53<00:24,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8540, UAS: 0.9268, LAS: 0.8706, UEM: 0.5445, LEM: 0.3183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9612, partial_loss/deprel_loss: 0.8148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9930, loss: 0.8901, batch_reg_loss: 0.1489, reg_loss: 0.1482 ||:  71%|#######1  | 79/111 [00:55<00:22,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9272, LAS: 0.8709, UEM: 0.5434, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3584, partial_loss/deprel_loss: 0.5370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6502, loss: 0.8875, batch_reg_loss: 0.1490, reg_loss: 0.1482 ||:  74%|#######3  | 82/111 [00:58<00:21,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8341, UAS: 0.9271, LAS: 0.8708, UEM: 0.5359, LEM: 0.3090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1788, partial_loss/deprel_loss: 0.9773, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1667, loss: 0.8887, batch_reg_loss: 0.1490, reg_loss: 0.1483 ||:  77%|#######7  | 86/111 [01:00<00:17,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8259, UAS: 0.9264, LAS: 0.8700, UEM: 0.5294, LEM: 0.3038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1285, partial_loss/deprel_loss: 1.1447, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2905, loss: 0.8945, batch_reg_loss: 0.1491, reg_loss: 0.1483 ||:  81%|########1 | 90/111 [01:02<00:13,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9266, LAS: 0.8703, UEM: 0.5230, LEM: 0.2979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9470, partial_loss/deprel_loss: 0.7802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9627, loss: 0.8945, batch_reg_loss: 0.1492, reg_loss: 0.1483 ||:  85%|########4 | 94/111 [01:05<00:11,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9273, LAS: 0.8712, UEM: 0.5234, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2959, partial_loss/deprel_loss: 0.5120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6180, loss: 0.8880, batch_reg_loss: 0.1493, reg_loss: 0.1484 ||:  88%|########8 | 98/111 [01:07<00:08,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8325, UAS: 0.9275, LAS: 0.8714, UEM: 0.5286, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2757, partial_loss/deprel_loss: 0.9351, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1526, loss: 0.8843, batch_reg_loss: 0.1493, reg_loss: 0.1484 ||:  92%|#########1| 102/111 [01:10<00:06,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9280, LAS: 0.8719, UEM: 0.5266, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5151, partial_loss/deprel_loss: 0.5887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7234, loss: 0.8805, batch_reg_loss: 0.1494, reg_loss: 0.1484 ||:  95%|#########5| 106/111 [01:13<00:03,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9284, LAS: 0.8724, UEM: 0.5281, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3449, partial_loss/deprel_loss: 0.4950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6144, loss: 0.8774, batch_reg_loss: 0.1494, reg_loss: 0.1485 ||:  99%|#########9| 110/111 [01:16<00:00,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8283, UAS: 0.9282, LAS: 0.8720, UEM: 0.5259, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1604, partial_loss/deprel_loss: 1.0838, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2486, loss: 0.8807, batch_reg_loss: 0.1495, reg_loss: 0.1485 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-06 23:50:09,062 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9534, LAS: 0.9001, UEM: 0.6753, LEM: 0.3628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1819, partial_loss/deprel_loss: 23.7693, partial_loss/cycle_loss: 0.0000, batch_loss: 19.0518, loss: 22.2928, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.17it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9487, LAS: 0.8920, UEM: 0.6040, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9910, partial_loss/deprel_loss: 37.4935, partial_loss/cycle_loss: 0.0000, batch_loss: 30.1930, loss: 23.5104, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.14it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9415, LAS: 0.8858, UEM: 0.5706, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9017, partial_loss/deprel_loss: 31.2307, partial_loss/cycle_loss: 0.0000, batch_loss: 25.1649, loss: 25.3184, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:07<00:03,  1.17it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9419, LAS: 0.8882, UEM: 0.6289, LEM: 0.3770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1918, partial_loss/deprel_loss: 20.7598, partial_loss/cycle_loss: 0.0000, batch_loss: 16.6462, loss: 25.8303, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:09<00:01,  1.10it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8678, UAS: 0.9422, LAS: 0.8879, UEM: 0.6232, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0590, partial_loss/deprel_loss: 43.7483, partial_loss/cycle_loss: 0.0000, batch_loss: 35.2104, loss: 26.2072, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00,  1.05it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8678, UAS: 0.9422, LAS: 0.8879, UEM: 0.6232, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0590, partial_loss/deprel_loss: 43.7483, partial_loss/cycle_loss: 0.0000, batch_loss: 35.2104, loss: 26.2072, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00,  1.09it/s]\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.084  |    43.748\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.160  |     1.059\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.148  |     0.000\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - UEM                      |     0.526  |     0.623\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - LAS                      |     0.872  |     0.888\n",
      "2023-04-06 23:50:21,016 - INFO - combo.training.tensorboard_writer - loss                     |     0.881  |    26.207\n",
      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - LEM                      |     0.296  |     0.363\n",
      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - UAS                      |     0.928  |     0.942\n",
      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - EM                       |     0.828  |     0.868\n",
      "2023-04-06 23:50:21,017 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:50:21,017 - INFO - combo.training.trainer - Epoch duration: 0:01:28.691575\n",
      "2023-04-06 23:50:21,018 - INFO - combo.training.trainer - Estimated training time remaining: 7:46:03\n",
      "2023-04-06 23:50:21,018 - INFO - allennlp.training.trainer - Epoch 46/399\n",
      "2023-04-06 23:50:21,018 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:50:21,018 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:50:21,024 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9393, LAS: 0.8848, UEM: 0.7867, LEM: 0.5840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1217, partial_loss/deprel_loss: 0.2555, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3782, loss: 0.7494, batch_reg_loss: 0.1495, reg_loss: 0.1495 ||:   3%|2         | 3/111 [00:02<01:20,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8622, UAS: 0.9277, LAS: 0.8710, UEM: 0.5986, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7870, partial_loss/deprel_loss: 0.9187, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0420, loss: 0.8931, batch_reg_loss: 0.1496, reg_loss: 0.1495 ||:   6%|6         | 7/111 [00:04<01:10,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9300, LAS: 0.8734, UEM: 0.5550, LEM: 0.3467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4426, partial_loss/deprel_loss: 0.5726, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6963, loss: 0.8855, batch_reg_loss: 0.1496, reg_loss: 0.1496 ||:  10%|9         | 11/111 [00:06<01:05,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9345, LAS: 0.8780, UEM: 0.5825, LEM: 0.3564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2641, partial_loss/deprel_loss: 0.3866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.8413, batch_reg_loss: 0.1497, reg_loss: 0.1496 ||:  13%|#2        | 14/111 [00:08<01:05,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9332, LAS: 0.8768, UEM: 0.5385, LEM: 0.3190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9611, partial_loss/deprel_loss: 0.9256, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0825, loss: 0.8551, batch_reg_loss: 0.1498, reg_loss: 0.1496 ||:  16%|#6        | 18/111 [00:11<01:00,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9320, LAS: 0.8767, UEM: 0.5975, LEM: 0.3967, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0807, partial_loss/deprel_loss: 0.1996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3256, loss: 0.8484, batch_reg_loss: 0.1498, reg_loss: 0.1496 ||:  20%|#9        | 22/111 [00:14<01:00,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9341, LAS: 0.8794, UEM: 0.5979, LEM: 0.3846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4832, partial_loss/deprel_loss: 0.6899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7985, loss: 0.8280, batch_reg_loss: 0.1499, reg_loss: 0.1497 ||:  23%|##2       | 25/111 [00:16<00:58,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9348, LAS: 0.8796, UEM: 0.5840, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3874, partial_loss/deprel_loss: 0.6064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7125, loss: 0.8244, batch_reg_loss: 0.1499, reg_loss: 0.1497 ||:  26%|##6       | 29/111 [00:19<00:55,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9347, LAS: 0.8794, UEM: 0.5729, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5306, partial_loss/deprel_loss: 0.5927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7302, loss: 0.8259, batch_reg_loss: 0.1500, reg_loss: 0.1497 ||:  29%|##8       | 32/111 [00:21<00:53,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9323, LAS: 0.8763, UEM: 0.5530, LEM: 0.3312, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5293, partial_loss/deprel_loss: 0.6402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7681, loss: 0.8487, batch_reg_loss: 0.1500, reg_loss: 0.1498 ||:  32%|###2      | 36/111 [00:23<00:49,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9328, LAS: 0.8771, UEM: 0.5633, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1378, partial_loss/deprel_loss: 0.3228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4359, loss: 0.8430, batch_reg_loss: 0.1501, reg_loss: 0.1498 ||:  35%|###5      | 39/111 [00:25<00:48,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9319, LAS: 0.8759, UEM: 0.5512, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.6162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7192, loss: 0.8529, batch_reg_loss: 0.1501, reg_loss: 0.1498 ||:  39%|###8      | 43/111 [00:28<00:45,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9323, LAS: 0.8762, UEM: 0.5401, LEM: 0.3185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4595, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6904, loss: 0.8498, batch_reg_loss: 0.1502, reg_loss: 0.1498 ||:  42%|####2     | 47/111 [00:30<00:41,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9327, LAS: 0.8767, UEM: 0.5498, LEM: 0.3266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0265, partial_loss/deprel_loss: 0.8848, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0634, loss: 0.8436, batch_reg_loss: 0.1503, reg_loss: 0.1499 ||:  46%|####5     | 51/111 [00:33<00:38,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8446, UAS: 0.9336, LAS: 0.8777, UEM: 0.5578, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9532, partial_loss/deprel_loss: 0.9401, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0931, loss: 0.8347, batch_reg_loss: 0.1503, reg_loss: 0.1499 ||:  50%|####9     | 55/111 [00:35<00:35,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8091, UAS: 0.9310, LAS: 0.8748, UEM: 0.5446, LEM: 0.3223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6452, partial_loss/deprel_loss: 1.0977, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3576, loss: 0.8591, batch_reg_loss: 0.1504, reg_loss: 0.1499 ||:  53%|#####3    | 59/111 [00:38<00:32,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9295, LAS: 0.8733, UEM: 0.5337, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5317, partial_loss/deprel_loss: 0.6523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7787, loss: 0.8732, batch_reg_loss: 0.1505, reg_loss: 0.1500 ||:  57%|#####6    | 63/111 [00:40<00:30,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9297, LAS: 0.8738, UEM: 0.5323, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2996, partial_loss/deprel_loss: 0.4510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5713, loss: 0.8672, batch_reg_loss: 0.1505, reg_loss: 0.1500 ||:  60%|######    | 67/111 [00:43<00:28,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9302, LAS: 0.8744, UEM: 0.5323, LEM: 0.3087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2982, partial_loss/deprel_loss: 0.4410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5631, loss: 0.8616, batch_reg_loss: 0.1506, reg_loss: 0.1500 ||:  64%|######3   | 71/111 [00:46<00:26,  1.51it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8887, UAS: 0.9310, LAS: 0.8752, UEM: 0.5322, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4613, partial_loss/deprel_loss: 0.6015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7241, loss: 0.8551, batch_reg_loss: 0.1507, reg_loss: 0.1501 ||:  68%|######7   | 75/111 [00:49<00:24,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9300, LAS: 0.8740, UEM: 0.5275, LEM: 0.2992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3972, partial_loss/deprel_loss: 0.5661, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6831, loss: 0.8679, batch_reg_loss: 0.1508, reg_loss: 0.1501 ||:  71%|#######1  | 79/111 [00:51<00:21,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8049, UAS: 0.9278, LAS: 0.8714, UEM: 0.5172, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6741, partial_loss/deprel_loss: 1.1973, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4435, loss: 0.8901, batch_reg_loss: 0.1508, reg_loss: 0.1501 ||:  75%|#######4  | 83/111 [00:54<00:18,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9281, LAS: 0.8717, UEM: 0.5223, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3916, partial_loss/deprel_loss: 0.5200, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6452, loss: 0.8872, batch_reg_loss: 0.1509, reg_loss: 0.1502 ||:  78%|#######8  | 87/111 [00:57<00:16,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8840, UAS: 0.9278, LAS: 0.8714, UEM: 0.5150, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5170, partial_loss/deprel_loss: 0.6603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7826, loss: 0.8900, batch_reg_loss: 0.1510, reg_loss: 0.1502 ||:  82%|########1 | 91/111 [00:59<00:13,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8360, UAS: 0.9279, LAS: 0.8717, UEM: 0.5151, LEM: 0.2906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3055, partial_loss/deprel_loss: 0.9726, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1902, loss: 0.8875, batch_reg_loss: 0.1511, reg_loss: 0.1502 ||:  86%|########5 | 95/111 [01:01<00:10,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9284, LAS: 0.8722, UEM: 0.5175, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1813, partial_loss/deprel_loss: 0.4224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5253, loss: 0.8842, batch_reg_loss: 0.1512, reg_loss: 0.1503 ||:  89%|########9 | 99/111 [01:04<00:07,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9288, LAS: 0.8727, UEM: 0.5197, LEM: 0.2928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2933, partial_loss/deprel_loss: 0.4974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6078, loss: 0.8797, batch_reg_loss: 0.1512, reg_loss: 0.1503 ||:  93%|#########2| 103/111 [01:07<00:05,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7736, UAS: 0.9286, LAS: 0.8725, UEM: 0.5249, LEM: 0.2976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1080, partial_loss/deprel_loss: 1.4011, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6937, loss: 0.8808, batch_reg_loss: 0.1513, reg_loss: 0.1504 ||:  96%|#########6| 107/111 [01:10<00:02,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9285, LAS: 0.8723, UEM: 0.5211, LEM: 0.2944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4362, partial_loss/deprel_loss: 0.5338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6656, loss: 0.8816, batch_reg_loss: 0.1513, reg_loss: 0.1504 ||:  99%|#########9| 110/111 [01:12<00:00,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9286, LAS: 0.8724, UEM: 0.5211, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5446, partial_loss/deprel_loss: 0.5990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7395, loss: 0.8803, batch_reg_loss: 0.1513, reg_loss: 0.1504 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:51:34,483 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.599  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.545  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.150  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - UEM                      |     0.521  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - LAS                      |     0.872  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - loss                     |     0.880  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - LEM                      |     0.294  |       N/A\n",
      "2023-04-06 23:51:34,484 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
      "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - EM                       |     0.890  |       N/A\n",
      "2023-04-06 23:51:34,485 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:51:34,486 - INFO - combo.training.trainer - Epoch duration: 0:01:13.468063\n",
      "2023-04-06 23:51:34,486 - INFO - combo.training.trainer - Estimated training time remaining: 7:44:03\n",
      "2023-04-06 23:51:34,486 - INFO - allennlp.training.trainer - Epoch 47/399\n",
      "2023-04-06 23:51:34,486 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:51:34,487 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:51:34,497 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8854, UAS: 0.9484, LAS: 0.8921, UEM: 0.5152, LEM: 0.2265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5373, partial_loss/deprel_loss: 0.6751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7989, loss: 0.7461, batch_reg_loss: 0.1514, reg_loss: 0.1514 ||:   4%|3         | 4/111 [00:02<01:05,  1.63it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9466, LAS: 0.8903, UEM: 0.5488, LEM: 0.2500, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4419, partial_loss/deprel_loss: 0.6563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7649, loss: 0.7337, batch_reg_loss: 0.1514, reg_loss: 0.1514 ||:   6%|6         | 7/111 [00:04<01:10,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9452, LAS: 0.8893, UEM: 0.5505, LEM: 0.2724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5635, partial_loss/deprel_loss: 0.6452, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7804, loss: 0.7389, batch_reg_loss: 0.1515, reg_loss: 0.1514 ||:   9%|9         | 10/111 [00:07<01:09,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8630, UAS: 0.9440, LAS: 0.8878, UEM: 0.5283, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8270, partial_loss/deprel_loss: 0.9081, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0434, loss: 0.7611, batch_reg_loss: 0.1515, reg_loss: 0.1514 ||:  12%|#1        | 13/111 [00:09<01:07,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9360, LAS: 0.8785, UEM: 0.4933, LEM: 0.2363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5545, partial_loss/deprel_loss: 0.6104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7509, loss: 0.8289, batch_reg_loss: 0.1516, reg_loss: 0.1515 ||:  15%|#5        | 17/111 [00:11<01:02,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9351, LAS: 0.8776, UEM: 0.4647, LEM: 0.2148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5660, partial_loss/deprel_loss: 0.6389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7760, loss: 0.8371, batch_reg_loss: 0.1517, reg_loss: 0.1515 ||:  19%|#8        | 21/111 [00:13<00:57,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9373, LAS: 0.8812, UEM: 0.4902, LEM: 0.2398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2424, partial_loss/deprel_loss: 0.4311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5451, loss: 0.8146, batch_reg_loss: 0.1517, reg_loss: 0.1515 ||:  22%|##1       | 24/111 [00:16<00:57,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9377, LAS: 0.8817, UEM: 0.5209, LEM: 0.2785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4732, partial_loss/deprel_loss: 0.6436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7613, loss: 0.8096, batch_reg_loss: 0.1518, reg_loss: 0.1516 ||:  24%|##4       | 27/111 [00:18<00:55,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8254, UAS: 0.9377, LAS: 0.8823, UEM: 0.5501, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4170, partial_loss/deprel_loss: 1.0259, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2560, loss: 0.8059, batch_reg_loss: 0.1518, reg_loss: 0.1516 ||:  28%|##7       | 31/111 [00:20<00:52,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9379, LAS: 0.8831, UEM: 0.5481, LEM: 0.3144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3535, partial_loss/deprel_loss: 0.4208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5592, loss: 0.8039, batch_reg_loss: 0.1519, reg_loss: 0.1516 ||:  31%|###       | 34/111 [00:22<00:51,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8378, UAS: 0.9348, LAS: 0.8797, UEM: 0.5299, LEM: 0.3030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1099, partial_loss/deprel_loss: 1.1716, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3112, loss: 0.8368, batch_reg_loss: 0.1519, reg_loss: 0.1516 ||:  33%|###3      | 37/111 [00:24<00:49,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8553, UAS: 0.9310, LAS: 0.8754, UEM: 0.5079, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8518, partial_loss/deprel_loss: 0.8380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9927, loss: 0.8694, batch_reg_loss: 0.1520, reg_loss: 0.1517 ||:  37%|###6      | 41/111 [00:27<00:46,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8168, UAS: 0.9289, LAS: 0.8730, UEM: 0.4885, LEM: 0.2745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4595, partial_loss/deprel_loss: 1.1418, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3574, loss: 0.8871, batch_reg_loss: 0.1521, reg_loss: 0.1517 ||:  41%|####      | 45/111 [00:29<00:43,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9281, LAS: 0.8723, UEM: 0.4868, LEM: 0.2702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4924, partial_loss/deprel_loss: 0.6568, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7761, loss: 0.8943, batch_reg_loss: 0.1521, reg_loss: 0.1517 ||:  44%|####4     | 49/111 [00:32<00:41,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9272, LAS: 0.8714, UEM: 0.4838, LEM: 0.2672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3521, partial_loss/deprel_loss: 0.5455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6591, loss: 0.9020, batch_reg_loss: 0.1522, reg_loss: 0.1518 ||:  47%|####6     | 52/111 [00:34<00:39,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9289, LAS: 0.8733, UEM: 0.5055, LEM: 0.2813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2791, partial_loss/deprel_loss: 0.4182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5426, loss: 0.8857, batch_reg_loss: 0.1523, reg_loss: 0.1518 ||:  50%|####9     | 55/111 [00:37<00:39,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9281, LAS: 0.8722, UEM: 0.4949, LEM: 0.2733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7369, partial_loss/deprel_loss: 0.7573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9055, loss: 0.8954, batch_reg_loss: 0.1523, reg_loss: 0.1518 ||:  52%|#####2    | 58/111 [00:39<00:37,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9273, LAS: 0.8712, UEM: 0.4849, LEM: 0.2654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5280, partial_loss/deprel_loss: 0.7407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8505, loss: 0.9024, batch_reg_loss: 0.1524, reg_loss: 0.1518 ||:  55%|#####4    | 61/111 [00:41<00:34,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9278, LAS: 0.8717, UEM: 0.4898, LEM: 0.2680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3571, partial_loss/deprel_loss: 0.5670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6775, loss: 0.8988, batch_reg_loss: 0.1525, reg_loss: 0.1519 ||:  59%|#####8    | 65/111 [00:43<00:30,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9284, LAS: 0.8724, UEM: 0.4908, LEM: 0.2672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7764, partial_loss/deprel_loss: 0.8388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9789, loss: 0.8927, batch_reg_loss: 0.1525, reg_loss: 0.1519 ||:  61%|######1   | 68/111 [00:45<00:29,  1.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9291, LAS: 0.8732, UEM: 0.5030, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1377, partial_loss/deprel_loss: 0.3870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4897, loss: 0.8876, batch_reg_loss: 0.1526, reg_loss: 0.1519 ||:  64%|######3   | 71/111 [00:48<00:28,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9283, LAS: 0.8722, UEM: 0.4949, LEM: 0.2694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9420, partial_loss/deprel_loss: 0.8445, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0166, loss: 0.8945, batch_reg_loss: 0.1526, reg_loss: 0.1520 ||:  68%|######7   | 75/111 [00:50<00:24,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9281, LAS: 0.8719, UEM: 0.4908, LEM: 0.2648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4672, partial_loss/deprel_loss: 0.6235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7450, loss: 0.8979, batch_reg_loss: 0.1527, reg_loss: 0.1520 ||:  71%|#######1  | 79/111 [00:53<00:21,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9287, LAS: 0.8727, UEM: 0.4885, LEM: 0.2607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5525, partial_loss/deprel_loss: 0.6233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7619, loss: 0.8915, batch_reg_loss: 0.1528, reg_loss: 0.1520 ||:  75%|#######4  | 83/111 [00:55<00:18,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8832, UAS: 0.9288, LAS: 0.8729, UEM: 0.4905, LEM: 0.2638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6938, partial_loss/deprel_loss: 0.7008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8522, loss: 0.8901, batch_reg_loss: 0.1528, reg_loss: 0.1521 ||:  78%|#######8  | 87/111 [00:58<00:15,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8669, UAS: 0.9289, LAS: 0.8732, UEM: 0.4935, LEM: 0.2668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8700, partial_loss/deprel_loss: 0.8386, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9978, loss: 0.8883, batch_reg_loss: 0.1529, reg_loss: 0.1521 ||:  82%|########1 | 91/111 [01:01<00:13,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9280, LAS: 0.8724, UEM: 0.4954, LEM: 0.2697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2556, partial_loss/deprel_loss: 0.3945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5197, loss: 0.8933, batch_reg_loss: 0.1530, reg_loss: 0.1521 ||:  85%|########4 | 94/111 [01:03<00:11,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9572, UAS: 0.9289, LAS: 0.8735, UEM: 0.5164, LEM: 0.2943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0686, partial_loss/deprel_loss: 0.1776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3088, loss: 0.8856, batch_reg_loss: 0.1530, reg_loss: 0.1522 ||:  87%|########7 | 97/111 [01:06<00:10,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9289, LAS: 0.8735, UEM: 0.5153, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3051, partial_loss/deprel_loss: 0.4620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5837, loss: 0.8855, batch_reg_loss: 0.1531, reg_loss: 0.1522 ||:  91%|######### | 101/111 [01:08<00:07,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9299, LAS: 0.8746, UEM: 0.5268, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2536, partial_loss/deprel_loss: 0.3871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5135, loss: 0.8753, batch_reg_loss: 0.1532, reg_loss: 0.1522 ||:  95%|#########4| 105/111 [01:10<00:03,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9301, LAS: 0.8749, UEM: 0.5290, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2639, partial_loss/deprel_loss: 0.4698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5818, loss: 0.8739, batch_reg_loss: 0.1532, reg_loss: 0.1523 ||:  98%|#########8| 109/111 [01:12<00:01,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9302, LAS: 0.8748, UEM: 0.5266, LEM: 0.3005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7826, partial_loss/deprel_loss: 0.8032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9523, loss: 0.8742, batch_reg_loss: 0.1532, reg_loss: 0.1523 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
      "2023-04-06 23:52:48,579 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:52:48,579 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.803  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.783  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.152  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - UEM                      |     0.527  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - LAS                      |     0.875  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - loss                     |     0.874  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - LEM                      |     0.301  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:52:48,580 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
      "2023-04-06 23:52:48,581 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:52:48,581 - INFO - combo.training.tensorboard_writer - EM                       |     0.861  |       N/A\n",
      "2023-04-06 23:52:48,581 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:52:48,581 - INFO - combo.training.trainer - Epoch duration: 0:01:14.095098\n",
      "2023-04-06 23:52:48,581 - INFO - combo.training.trainer - Estimated training time remaining: 7:42:09\n",
      "2023-04-06 23:52:48,581 - INFO - allennlp.training.trainer - Epoch 48/399\n",
      "2023-04-06 23:52:48,581 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:52:48,582 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:52:48,587 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9342, LAS: 0.8798, UEM: 0.4156, LEM: 0.1978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4324, partial_loss/deprel_loss: 0.5304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6641, loss: 0.8418, batch_reg_loss: 0.1533, reg_loss: 0.1533 ||:   4%|3         | 4/111 [00:02<01:08,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8507, UAS: 0.9253, LAS: 0.8706, UEM: 0.3450, LEM: 0.1517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0604, partial_loss/deprel_loss: 0.8071, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0111, loss: 0.9093, batch_reg_loss: 0.1534, reg_loss: 0.1533 ||:   7%|7         | 8/111 [00:04<01:04,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8520, UAS: 0.9315, LAS: 0.8776, UEM: 0.5266, LEM: 0.3168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9183, partial_loss/deprel_loss: 0.9036, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0599, loss: 0.8473, batch_reg_loss: 0.1534, reg_loss: 0.1533 ||:  10%|9         | 11/111 [00:07<01:08,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9278, LAS: 0.8743, UEM: 0.5129, LEM: 0.3092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9617, partial_loss/deprel_loss: 0.8241, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0050, loss: 0.8777, batch_reg_loss: 0.1534, reg_loss: 0.1533 ||:  13%|#2        | 14/111 [00:09<01:06,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9300, LAS: 0.8761, UEM: 0.5064, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7605, partial_loss/deprel_loss: 0.8143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9571, loss: 0.8568, batch_reg_loss: 0.1535, reg_loss: 0.1534 ||:  16%|#6        | 18/111 [00:12<01:02,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9269, LAS: 0.8725, UEM: 0.4682, LEM: 0.2664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0474, partial_loss/deprel_loss: 0.8697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0588, loss: 0.8885, batch_reg_loss: 0.1536, reg_loss: 0.1534 ||:  20%|#9        | 22/111 [00:14<00:58,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9289, LAS: 0.8747, UEM: 0.4699, LEM: 0.2578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4745, partial_loss/deprel_loss: 0.5828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7148, loss: 0.8740, batch_reg_loss: 0.1536, reg_loss: 0.1534 ||:  23%|##3       | 26/111 [00:16<00:54,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9288, LAS: 0.8747, UEM: 0.4876, LEM: 0.2748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3346, partial_loss/deprel_loss: 0.4859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6094, loss: 0.8699, batch_reg_loss: 0.1537, reg_loss: 0.1535 ||:  27%|##7       | 30/111 [00:19<00:52,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9319, LAS: 0.8781, UEM: 0.5407, LEM: 0.3196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1436, partial_loss/deprel_loss: 0.3075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4285, loss: 0.8452, batch_reg_loss: 0.1538, reg_loss: 0.1535 ||:  30%|##9       | 33/111 [00:21<00:53,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9313, LAS: 0.8776, UEM: 0.5379, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.5909, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7208, loss: 0.8510, batch_reg_loss: 0.1538, reg_loss: 0.1535 ||:  33%|###3      | 37/111 [00:24<00:49,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9324, LAS: 0.8791, UEM: 0.5453, LEM: 0.3157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3170, partial_loss/deprel_loss: 0.4551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5813, loss: 0.8379, batch_reg_loss: 0.1539, reg_loss: 0.1536 ||:  36%|###6      | 40/111 [00:26<00:48,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9319, LAS: 0.8783, UEM: 0.5334, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5949, partial_loss/deprel_loss: 0.6138, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7640, loss: 0.8391, batch_reg_loss: 0.1539, reg_loss: 0.1536 ||:  39%|###8      | 43/111 [00:28<00:47,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9336, LAS: 0.8803, UEM: 0.5564, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.3773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5012, loss: 0.8227, batch_reg_loss: 0.1540, reg_loss: 0.1536 ||:  41%|####1     | 46/111 [00:31<00:46,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9314, LAS: 0.8775, UEM: 0.5413, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5589, partial_loss/deprel_loss: 0.5810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7306, loss: 0.8463, batch_reg_loss: 0.1540, reg_loss: 0.1536 ||:  45%|####5     | 50/111 [00:33<00:42,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9315, LAS: 0.8776, UEM: 0.5407, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4884, loss: 0.8460, batch_reg_loss: 0.1541, reg_loss: 0.1537 ||:  48%|####7     | 53/111 [00:35<00:40,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9324, LAS: 0.8785, UEM: 0.5441, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3978, partial_loss/deprel_loss: 0.6004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7141, loss: 0.8389, batch_reg_loss: 0.1542, reg_loss: 0.1537 ||:  51%|#####1    | 57/111 [00:38<00:37,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9316, LAS: 0.8776, UEM: 0.5364, LEM: 0.3044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6206, partial_loss/deprel_loss: 0.7314, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8634, loss: 0.8457, batch_reg_loss: 0.1542, reg_loss: 0.1537 ||:  54%|#####4    | 60/111 [00:40<00:35,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7838, UAS: 0.9304, LAS: 0.8762, UEM: 0.5293, LEM: 0.2987, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.1126, partial_loss/deprel_loss: 1.3161, partial_loss/cycle_loss: 0.0000, batch_loss: 1.6297, loss: 0.8591, batch_reg_loss: 0.1543, reg_loss: 0.1538 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9300, LAS: 0.8758, UEM: 0.5307, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2438, partial_loss/deprel_loss: 0.3579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4894, loss: 0.8597, batch_reg_loss: 0.1543, reg_loss: 0.1538 ||:  60%|######    | 67/111 [00:45<00:30,  1.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9313, LAS: 0.8773, UEM: 0.5548, LEM: 0.3303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0642, partial_loss/deprel_loss: 0.1699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3031, loss: 0.8491, batch_reg_loss: 0.1544, reg_loss: 0.1538 ||:  63%|######3   | 70/111 [00:47<00:29,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.9314, LAS: 0.8771, UEM: 0.5535, LEM: 0.3281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1907, partial_loss/deprel_loss: 1.0234, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2113, loss: 0.8511, batch_reg_loss: 0.1544, reg_loss: 0.1538 ||:  66%|######5   | 73/111 [00:50<00:28,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9308, LAS: 0.8763, UEM: 0.5414, LEM: 0.3172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5767, partial_loss/deprel_loss: 0.7398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8617, loss: 0.8574, batch_reg_loss: 0.1545, reg_loss: 0.1539 ||:  69%|######9   | 77/111 [00:52<00:24,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8864, UAS: 0.9307, LAS: 0.8762, UEM: 0.5364, LEM: 0.3123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4993, partial_loss/deprel_loss: 0.6346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7621, loss: 0.8571, batch_reg_loss: 0.1546, reg_loss: 0.1539 ||:  73%|#######2  | 81/111 [00:54<00:20,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9312, LAS: 0.8766, UEM: 0.5370, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4384, partial_loss/deprel_loss: 0.6207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7389, loss: 0.8523, batch_reg_loss: 0.1546, reg_loss: 0.1539 ||:  76%|#######5  | 84/111 [00:57<00:18,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9312, LAS: 0.8766, UEM: 0.5312, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7141, partial_loss/deprel_loss: 0.6809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8422, loss: 0.8526, batch_reg_loss: 0.1547, reg_loss: 0.1539 ||:  78%|#######8  | 87/111 [00:59<00:16,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9298, LAS: 0.8751, UEM: 0.5309, LEM: 0.3053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1345, partial_loss/deprel_loss: 0.9797, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1654, loss: 0.8649, batch_reg_loss: 0.1547, reg_loss: 0.1540 ||:  81%|########1 | 90/111 [01:01<00:14,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.9301, LAS: 0.8755, UEM: 0.5403, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5235, partial_loss/deprel_loss: 0.6702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7956, loss: 0.8621, batch_reg_loss: 0.1548, reg_loss: 0.1540 ||:  84%|########3 | 93/111 [01:03<00:12,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8038, UAS: 0.9290, LAS: 0.8744, UEM: 0.5343, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9209, partial_loss/deprel_loss: 1.1134, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4297, loss: 0.8719, batch_reg_loss: 0.1548, reg_loss: 0.1540 ||:  86%|########6 | 96/111 [01:05<00:10,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9294, LAS: 0.8747, UEM: 0.5321, LEM: 0.3085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3043, partial_loss/deprel_loss: 0.5841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6830, loss: 0.8683, batch_reg_loss: 0.1549, reg_loss: 0.1541 ||:  90%|######### | 100/111 [01:08<00:07,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8439, UAS: 0.9285, LAS: 0.8737, UEM: 0.5242, LEM: 0.3027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1519, partial_loss/deprel_loss: 0.9448, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1412, loss: 0.8762, batch_reg_loss: 0.1550, reg_loss: 0.1541 ||:  94%|#########3| 104/111 [01:10<00:04,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9284, LAS: 0.8734, UEM: 0.5209, LEM: 0.2983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3185, partial_loss/deprel_loss: 0.4996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6184, loss: 0.8786, batch_reg_loss: 0.1550, reg_loss: 0.1541 ||:  97%|#########7| 108/111 [01:13<00:01,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9289, LAS: 0.8740, UEM: 0.5235, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3537, partial_loss/deprel_loss: 0.4988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6249, loss: 0.8731, batch_reg_loss: 0.1551, reg_loss: 0.1542 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.499  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.354  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.154  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - UEM                      |     0.523  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - LAS                      |     0.874  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - loss                     |     0.873  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:54:04,142 - INFO - combo.training.tensorboard_writer - LEM                      |     0.298  |       N/A\n",
      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - EM                       |     0.896  |       N/A\n",
      "2023-04-06 23:54:04,143 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:54:04,143 - INFO - combo.training.trainer - Epoch duration: 0:01:15.561956\n",
      "2023-04-06 23:54:04,143 - INFO - combo.training.trainer - Estimated training time remaining: 7:40:27\n",
      "2023-04-06 23:54:04,143 - INFO - allennlp.training.trainer - Epoch 49/399\n",
      "2023-04-06 23:54:04,144 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:54:04,144 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:54:04,149 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7909, UAS: 0.8954, LAS: 0.8373, UEM: 0.3531, LEM: 0.2014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9718, partial_loss/deprel_loss: 1.1487, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4685, loss: 1.1159, batch_reg_loss: 0.1552, reg_loss: 0.1552 ||:   4%|3         | 4/111 [00:02<01:10,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9175, LAS: 0.8616, UEM: 0.4567, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3460, partial_loss/deprel_loss: 0.4872, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6142, loss: 0.9446, batch_reg_loss: 0.1553, reg_loss: 0.1552 ||:   7%|7         | 8/111 [00:05<01:06,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9264, LAS: 0.8697, UEM: 0.5122, LEM: 0.2647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3347, partial_loss/deprel_loss: 0.5663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6753, loss: 0.8896, batch_reg_loss: 0.1553, reg_loss: 0.1552 ||:  10%|9         | 11/111 [00:07<01:07,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8149, UAS: 0.9191, LAS: 0.8626, UEM: 0.4610, LEM: 0.2322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7589, partial_loss/deprel_loss: 1.0592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3545, loss: 0.9608, batch_reg_loss: 0.1554, reg_loss: 0.1553 ||:  14%|#3        | 15/111 [00:09<01:02,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9214, LAS: 0.8657, UEM: 0.4965, LEM: 0.2659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1912, partial_loss/deprel_loss: 0.3556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4782, loss: 0.9304, batch_reg_loss: 0.1554, reg_loss: 0.1553 ||:  17%|#7        | 19/111 [00:12<00:58,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9223, LAS: 0.8664, UEM: 0.4895, LEM: 0.2537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3587, partial_loss/deprel_loss: 0.5543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6707, loss: 0.9235, batch_reg_loss: 0.1555, reg_loss: 0.1553 ||:  21%|##        | 23/111 [00:14<00:57,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9252, LAS: 0.8696, UEM: 0.4974, LEM: 0.2570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2637, partial_loss/deprel_loss: 0.3971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5260, loss: 0.8980, batch_reg_loss: 0.1556, reg_loss: 0.1554 ||:  24%|##4       | 27/111 [00:17<00:54,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8481, UAS: 0.9248, LAS: 0.8688, UEM: 0.4822, LEM: 0.2448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9313, partial_loss/deprel_loss: 0.9207, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0785, loss: 0.9065, batch_reg_loss: 0.1556, reg_loss: 0.1554 ||:  27%|##7       | 30/111 [00:19<00:53,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9285, LAS: 0.8729, UEM: 0.5310, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3969, partial_loss/deprel_loss: 0.4874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6250, loss: 0.8737, batch_reg_loss: 0.1557, reg_loss: 0.1554 ||:  30%|##9       | 33/111 [00:22<00:55,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9296, LAS: 0.8746, UEM: 0.5256, LEM: 0.2821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6425, partial_loss/deprel_loss: 0.6280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 0.8591, batch_reg_loss: 0.1558, reg_loss: 0.1554 ||:  33%|###3      | 37/111 [00:24<00:50,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9294, LAS: 0.8742, UEM: 0.5161, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3167, partial_loss/deprel_loss: 0.4630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5896, loss: 0.8647, batch_reg_loss: 0.1558, reg_loss: 0.1555 ||:  37%|###6      | 41/111 [00:26<00:44,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8782, UAS: 0.9300, LAS: 0.8749, UEM: 0.5093, LEM: 0.2689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6331, partial_loss/deprel_loss: 0.7067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8478, loss: 0.8596, batch_reg_loss: 0.1559, reg_loss: 0.1555 ||:  41%|####      | 45/111 [00:29<00:43,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9313, LAS: 0.8765, UEM: 0.5172, LEM: 0.2726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2331, partial_loss/deprel_loss: 0.4538, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5656, loss: 0.8482, batch_reg_loss: 0.1559, reg_loss: 0.1555 ||:  44%|####4     | 49/111 [00:31<00:39,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9308, LAS: 0.8760, UEM: 0.5255, LEM: 0.2803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3214, partial_loss/deprel_loss: 0.5428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6545, loss: 0.8538, batch_reg_loss: 0.1560, reg_loss: 0.1556 ||:  48%|####7     | 53/111 [00:34<00:39,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9295, LAS: 0.8748, UEM: 0.5237, LEM: 0.2787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4346, partial_loss/deprel_loss: 0.6295, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7466, loss: 0.8677, batch_reg_loss: 0.1560, reg_loss: 0.1556 ||:  50%|#####     | 56/111 [00:37<00:38,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9301, LAS: 0.8753, UEM: 0.5200, LEM: 0.2719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5485, partial_loss/deprel_loss: 0.6739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8050, loss: 0.8635, batch_reg_loss: 0.1561, reg_loss: 0.1556 ||:  53%|#####3    | 59/111 [00:39<00:36,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9304, LAS: 0.8758, UEM: 0.5333, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1874, partial_loss/deprel_loss: 0.3743, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4931, loss: 0.8582, batch_reg_loss: 0.1561, reg_loss: 0.1557 ||:  56%|#####5    | 62/111 [00:41<00:35,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9301, LAS: 0.8755, UEM: 0.5277, LEM: 0.2818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3650, partial_loss/deprel_loss: 0.5520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6708, loss: 0.8625, batch_reg_loss: 0.1562, reg_loss: 0.1557 ||:  59%|#####8    | 65/111 [00:43<00:32,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9311, LAS: 0.8764, UEM: 0.5335, LEM: 0.2839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5554, partial_loss/deprel_loss: 0.6621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7970, loss: 0.8548, batch_reg_loss: 0.1562, reg_loss: 0.1557 ||:  61%|######1   | 68/111 [00:46<00:32,  1.34it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9304, LAS: 0.8755, UEM: 0.5226, LEM: 0.2760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8234, partial_loss/deprel_loss: 0.7134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8917, loss: 0.8620, batch_reg_loss: 0.1563, reg_loss: 0.1557 ||:  65%|######4   | 72/111 [00:48<00:28,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8284, UAS: 0.9302, LAS: 0.8751, UEM: 0.5187, LEM: 0.2726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4144, partial_loss/deprel_loss: 1.0153, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2515, loss: 0.8652, batch_reg_loss: 0.1564, reg_loss: 0.1558 ||:  68%|######8   | 76/111 [00:51<00:24,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9312, LAS: 0.8763, UEM: 0.5408, LEM: 0.2998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4109, partial_loss/deprel_loss: 0.5739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6977, loss: 0.8563, batch_reg_loss: 0.1564, reg_loss: 0.1558 ||:  71%|#######1  | 79/111 [00:54<00:24,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9311, LAS: 0.8763, UEM: 0.5334, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5825, partial_loss/deprel_loss: 0.6902, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8251, loss: 0.8572, batch_reg_loss: 0.1565, reg_loss: 0.1558 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8287, UAS: 0.9302, LAS: 0.8752, UEM: 0.5287, LEM: 0.2902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3085, partial_loss/deprel_loss: 1.0597, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2660, loss: 0.8685, batch_reg_loss: 0.1565, reg_loss: 0.1558 ||:  78%|#######8  | 87/111 [00:58<00:16,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9299, LAS: 0.8749, UEM: 0.5339, LEM: 0.2979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1485, partial_loss/deprel_loss: 0.3128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4365, loss: 0.8724, batch_reg_loss: 0.1566, reg_loss: 0.1559 ||:  81%|########1 | 90/111 [01:01<00:14,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9307, LAS: 0.8758, UEM: 0.5454, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7527, partial_loss/deprel_loss: 0.7827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9333, loss: 0.8654, batch_reg_loss: 0.1566, reg_loss: 0.1559 ||:  84%|########3 | 93/111 [01:03<00:12,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9312, LAS: 0.8764, UEM: 0.5440, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8018, partial_loss/deprel_loss: 0.8328, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9833, loss: 0.8617, batch_reg_loss: 0.1567, reg_loss: 0.1559 ||:  87%|########7 | 97/111 [01:05<00:09,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9300, LAS: 0.8753, UEM: 0.5369, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5177, partial_loss/deprel_loss: 0.6388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7714, loss: 0.8700, batch_reg_loss: 0.1568, reg_loss: 0.1560 ||:  91%|######### | 101/111 [01:07<00:06,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8587, UAS: 0.9295, LAS: 0.8746, UEM: 0.5288, LEM: 0.2978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8003, partial_loss/deprel_loss: 0.8681, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0114, loss: 0.8759, batch_reg_loss: 0.1568, reg_loss: 0.1560 ||:  95%|#########4| 105/111 [01:10<00:03,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9292, LAS: 0.8742, UEM: 0.5270, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8836, partial_loss/deprel_loss: 0.8153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9858, loss: 0.8781, batch_reg_loss: 0.1569, reg_loss: 0.1560 ||:  98%|#########8| 109/111 [01:12<00:01,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9294, LAS: 0.8745, UEM: 0.5276, LEM: 0.2970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2578, partial_loss/deprel_loss: 0.4366, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5578, loss: 0.8755, batch_reg_loss: 0.1569, reg_loss: 0.1560 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.437  |       N/A\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.258  |       N/A\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.156  |       N/A\n",
      "2023-04-06 23:55:18,545 - INFO - combo.training.tensorboard_writer - UEM                      |     0.528  |       N/A\n",
      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - LAS                      |     0.874  |       N/A\n",
      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - loss                     |     0.876  |       N/A\n",
      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - LEM                      |     0.297  |       N/A\n",
      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - UAS                      |     0.929  |       N/A\n",
      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - EM                       |     0.914  |       N/A\n",
      "2023-04-06 23:55:18,546 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:55:18,547 - INFO - combo.training.trainer - Epoch duration: 0:01:14.403031\n",
      "2023-04-06 23:55:18,547 - INFO - combo.training.trainer - Estimated training time remaining: 7:38:38\n",
      "2023-04-06 23:55:18,547 - INFO - allennlp.training.trainer - Epoch 50/399\n",
      "2023-04-06 23:55:18,547 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:55:18,547 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:55:18,553 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8449, UAS: 0.9290, LAS: 0.8760, UEM: 0.5054, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1142, partial_loss/deprel_loss: 0.8807, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0844, loss: 0.8502, batch_reg_loss: 0.1570, reg_loss: 0.1570 ||:   3%|2         | 3/111 [00:02<01:19,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9221, LAS: 0.8702, UEM: 0.4812, LEM: 0.2827, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2506, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5150, loss: 0.8912, batch_reg_loss: 0.1571, reg_loss: 0.1570 ||:   6%|6         | 7/111 [00:04<01:14,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9285, LAS: 0.8777, UEM: 0.5969, LEM: 0.3922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2795, partial_loss/deprel_loss: 0.4394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5646, loss: 0.8423, batch_reg_loss: 0.1571, reg_loss: 0.1570 ||:   9%|9         | 10/111 [00:07<01:17,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9283, LAS: 0.8774, UEM: 0.5628, LEM: 0.3540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5145, partial_loss/deprel_loss: 0.5950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7361, loss: 0.8468, batch_reg_loss: 0.1572, reg_loss: 0.1571 ||:  12%|#1        | 13/111 [00:09<01:12,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8716, UAS: 0.9320, LAS: 0.8807, UEM: 0.5504, LEM: 0.3256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7563, partial_loss/deprel_loss: 0.7074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8744, loss: 0.8170, batch_reg_loss: 0.1572, reg_loss: 0.1571 ||:  15%|#5        | 17/111 [00:12<01:07,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9309, LAS: 0.8794, UEM: 0.5287, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7209, partial_loss/deprel_loss: 0.7438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8965, loss: 0.8283, batch_reg_loss: 0.1573, reg_loss: 0.1571 ||:  18%|#8        | 20/111 [00:14<01:05,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8030, UAS: 0.9249, LAS: 0.8730, UEM: 0.4993, LEM: 0.2896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9332, partial_loss/deprel_loss: 1.1208, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4406, loss: 0.8825, batch_reg_loss: 0.1573, reg_loss: 0.1571 ||:  21%|##        | 23/111 [00:16<01:03,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9282, LAS: 0.8763, UEM: 0.5111, LEM: 0.2914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2713, partial_loss/deprel_loss: 0.4207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5482, loss: 0.8626, batch_reg_loss: 0.1574, reg_loss: 0.1572 ||:  24%|##4       | 27/111 [00:18<00:56,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8736, UAS: 0.9296, LAS: 0.8774, UEM: 0.5096, LEM: 0.2850, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7129, partial_loss/deprel_loss: 0.7503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9003, loss: 0.8551, batch_reg_loss: 0.1574, reg_loss: 0.1572 ||:  27%|##7       | 30/111 [00:21<00:55,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9288, LAS: 0.8761, UEM: 0.5080, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2659, partial_loss/deprel_loss: 0.3883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5213, loss: 0.8652, batch_reg_loss: 0.1575, reg_loss: 0.1572 ||:  31%|###       | 34/111 [00:23<00:52,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9288, LAS: 0.8758, UEM: 0.5034, LEM: 0.2842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5541, partial_loss/deprel_loss: 0.7148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8402, loss: 0.8701, batch_reg_loss: 0.1576, reg_loss: 0.1573 ||:  33%|###3      | 37/111 [00:25<00:50,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9306, LAS: 0.8774, UEM: 0.5220, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1300, partial_loss/deprel_loss: 0.3725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4816, loss: 0.8589, batch_reg_loss: 0.1576, reg_loss: 0.1573 ||:  36%|###6      | 40/111 [00:27<00:49,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8382, UAS: 0.9289, LAS: 0.8753, UEM: 0.5036, LEM: 0.2838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1688, partial_loss/deprel_loss: 0.8952, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1076, loss: 0.8755, batch_reg_loss: 0.1577, reg_loss: 0.1573 ||:  40%|###9      | 44/111 [00:30<00:45,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9303, LAS: 0.8768, UEM: 0.5211, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5037, partial_loss/deprel_loss: 0.6167, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7518, loss: 0.8604, batch_reg_loss: 0.1577, reg_loss: 0.1573 ||:  42%|####2     | 47/111 [00:32<00:43,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.9302, LAS: 0.8764, UEM: 0.5122, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8860, partial_loss/deprel_loss: 0.8571, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0207, loss: 0.8628, batch_reg_loss: 0.1578, reg_loss: 0.1574 ||:  45%|####5     | 50/111 [00:34<00:41,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7913, UAS: 0.9295, LAS: 0.8755, UEM: 0.5144, LEM: 0.2883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9336, partial_loss/deprel_loss: 1.3001, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5847, loss: 0.8703, batch_reg_loss: 0.1578, reg_loss: 0.1574 ||:  48%|####7     | 53/111 [00:37<00:42,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9300, LAS: 0.8766, UEM: 0.5481, LEM: 0.3316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5420, partial_loss/deprel_loss: 1.0670, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3199, loss: 0.8646, batch_reg_loss: 0.1579, reg_loss: 0.1574 ||:  50%|#####     | 56/111 [00:39<00:40,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7832, UAS: 0.9297, LAS: 0.8761, UEM: 0.5495, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8045, partial_loss/deprel_loss: 1.2793, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5423, loss: 0.8670, batch_reg_loss: 0.1579, reg_loss: 0.1574 ||:  54%|#####4    | 60/111 [00:42<00:36,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9289, LAS: 0.8751, UEM: 0.5481, LEM: 0.3267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3008, partial_loss/deprel_loss: 0.5128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6284, loss: 0.8746, batch_reg_loss: 0.1580, reg_loss: 0.1575 ||:  57%|#####6    | 63/111 [00:44<00:34,  1.41it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9069, UAS: 0.9290, LAS: 0.8750, UEM: 0.5390, LEM: 0.3177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3938, partial_loss/deprel_loss: 0.5525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6788, loss: 0.8767, batch_reg_loss: 0.1581, reg_loss: 0.1575 ||:  60%|######    | 67/111 [00:46<00:30,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9295, LAS: 0.8755, UEM: 0.5369, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3454, partial_loss/deprel_loss: 0.5430, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6616, loss: 0.8744, batch_reg_loss: 0.1581, reg_loss: 0.1575 ||:  64%|######3   | 71/111 [00:49<00:26,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8429, UAS: 0.9296, LAS: 0.8755, UEM: 0.5377, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0116, partial_loss/deprel_loss: 1.0316, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1858, loss: 0.8755, batch_reg_loss: 0.1582, reg_loss: 0.1576 ||:  67%|######6   | 74/111 [00:51<00:25,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8721, UAS: 0.9294, LAS: 0.8754, UEM: 0.5309, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8416, partial_loss/deprel_loss: 0.7885, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9573, loss: 0.8776, batch_reg_loss: 0.1582, reg_loss: 0.1576 ||:  70%|#######   | 78/111 [00:53<00:21,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8451, UAS: 0.9293, LAS: 0.8752, UEM: 0.5232, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9259, partial_loss/deprel_loss: 0.9234, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0822, loss: 0.8784, batch_reg_loss: 0.1583, reg_loss: 0.1576 ||:  74%|#######3  | 82/111 [00:55<00:18,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9294, LAS: 0.8752, UEM: 0.5207, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2829, partial_loss/deprel_loss: 0.4930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6093, loss: 0.8777, batch_reg_loss: 0.1583, reg_loss: 0.1577 ||:  77%|#######7  | 86/111 [00:58<00:15,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8559, UAS: 0.9291, LAS: 0.8750, UEM: 0.5146, LEM: 0.2938, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1339, partial_loss/deprel_loss: 0.9053, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1094, loss: 0.8806, batch_reg_loss: 0.1584, reg_loss: 0.1577 ||:  81%|########1 | 90/111 [01:01<00:13,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9299, LAS: 0.8757, UEM: 0.5307, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2277, partial_loss/deprel_loss: 0.4237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5429, loss: 0.8738, batch_reg_loss: 0.1585, reg_loss: 0.1577 ||:  85%|########4 | 94/111 [01:04<00:11,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9301, LAS: 0.8760, UEM: 0.5314, LEM: 0.3079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3976, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6621, loss: 0.8717, batch_reg_loss: 0.1585, reg_loss: 0.1578 ||:  87%|########7 | 97/111 [01:06<00:09,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8842, UAS: 0.9302, LAS: 0.8758, UEM: 0.5269, LEM: 0.3024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5324, partial_loss/deprel_loss: 0.6760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8058, loss: 0.8718, batch_reg_loss: 0.1586, reg_loss: 0.1578 ||:  91%|######### | 101/111 [01:08<00:06,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9307, LAS: 0.8763, UEM: 0.5341, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2046, partial_loss/deprel_loss: 0.4037, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5225, loss: 0.8681, batch_reg_loss: 0.1586, reg_loss: 0.1578 ||:  95%|#########4| 105/111 [01:11<00:04,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9308, LAS: 0.8765, UEM: 0.5314, LEM: 0.3036, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5598, partial_loss/deprel_loss: 0.6800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8146, loss: 0.8667, batch_reg_loss: 0.1587, reg_loss: 0.1578 ||:  97%|#########7| 108/111 [01:13<00:02,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9303, LAS: 0.8757, UEM: 0.5319, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.4364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5654, loss: 0.8721, batch_reg_loss: 0.1587, reg_loss: 0.1579 ||: 100%|##########| 111/111 [01:16<00:00,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9303, LAS: 0.8757, UEM: 0.5319, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.4364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5654, loss: 0.8721, batch_reg_loss: 0.1587, reg_loss: 0.1579 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
      "2023-04-06 23:56:34,705 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9351, LAS: 0.8773, UEM: 0.4018, LEM: 0.1232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6037, partial_loss/deprel_loss: 24.7088, partial_loss/cycle_loss: 0.0000, batch_loss: 19.8878, loss: 28.6320, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.10it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9493, LAS: 0.8951, UEM: 0.6527, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 26.6414, partial_loss/cycle_loss: 0.0000, batch_loss: 21.3933, loss: 25.2934, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:07,  1.06it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8618, UAS: 0.9439, LAS: 0.8897, UEM: 0.5984, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2572, partial_loss/deprel_loss: 49.6530, partial_loss/cycle_loss: 0.0000, batch_loss: 39.9738, loss: 26.4770, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.07it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8273, UAS: 0.9402, LAS: 0.8860, UEM: 0.5746, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6577, partial_loss/deprel_loss: 58.9864, partial_loss/cycle_loss: 0.0000, batch_loss: 47.5206, loss: 27.0998, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:09<00:01,  1.11it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9427, LAS: 0.8904, UEM: 0.6365, LEM: 0.3750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6548, partial_loss/deprel_loss: 35.0931, partial_loss/cycle_loss: 0.0000, batch_loss: 28.2055, loss: 26.3856, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:11<00:00,  1.10it/s]\n",
      "2023-04-06 23:56:46,535 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.436  |    35.093\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.288  |     0.655\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.158  |     0.000\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - UEM                      |     0.532  |     0.636\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - LAS                      |     0.876  |     0.890\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - loss                     |     0.872  |    26.386\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - LEM                      |     0.305  |     0.375\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:56:46,536 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |     0.943\n",
      "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - EM                       |     0.911  |     0.885\n",
      "2023-04-06 23:56:46,537 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:56:46,537 - INFO - combo.training.trainer - Epoch duration: 0:01:27.990431\n",
      "2023-04-06 23:56:46,537 - INFO - combo.training.trainer - Estimated training time remaining: 7:38:24\n",
      "2023-04-06 23:56:46,537 - INFO - allennlp.training.trainer - Epoch 51/399\n",
      "2023-04-06 23:56:46,537 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:56:46,538 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:56:46,543 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9240, LAS: 0.8692, UEM: 0.6476, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2921, partial_loss/deprel_loss: 0.4776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5993, loss: 0.9016, batch_reg_loss: 0.1588, reg_loss: 0.1587 ||:   3%|2         | 3/111 [00:02<01:13,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9277, LAS: 0.8749, UEM: 0.6799, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4705, partial_loss/deprel_loss: 0.5734, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7116, loss: 0.8611, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:   5%|5         | 6/111 [00:04<01:13,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9217, LAS: 0.8687, UEM: 0.6278, LEM: 0.3871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3600, partial_loss/deprel_loss: 0.4258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5715, loss: 0.9148, batch_reg_loss: 0.1589, reg_loss: 0.1588 ||:   9%|9         | 10/111 [00:06<01:07,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9316, LAS: 0.8807, UEM: 0.6713, LEM: 0.4400, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1199, partial_loss/deprel_loss: 0.2607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3915, loss: 0.8255, batch_reg_loss: 0.1589, reg_loss: 0.1588 ||:  13%|#2        | 14/111 [00:09<01:05,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8761, UAS: 0.9349, LAS: 0.8836, UEM: 0.6458, LEM: 0.4052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6169, partial_loss/deprel_loss: 0.6818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8278, loss: 0.8022, batch_reg_loss: 0.1590, reg_loss: 0.1589 ||:  16%|#6        | 18/111 [00:11<01:00,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8600, UAS: 0.9336, LAS: 0.8810, UEM: 0.6118, LEM: 0.3778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8011, partial_loss/deprel_loss: 0.8718, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0168, loss: 0.8227, batch_reg_loss: 0.1591, reg_loss: 0.1589 ||:  20%|#9        | 22/111 [00:14<00:58,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9371, LAS: 0.8849, UEM: 0.6244, LEM: 0.3825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4766, partial_loss/deprel_loss: 0.6570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.7951, batch_reg_loss: 0.1591, reg_loss: 0.1589 ||:  23%|##3       | 26/111 [00:17<00:55,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9349, LAS: 0.8821, UEM: 0.5989, LEM: 0.3635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2324, partial_loss/deprel_loss: 1.1135, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2964, loss: 0.8195, batch_reg_loss: 0.1592, reg_loss: 0.1590 ||:  26%|##6       | 29/111 [00:19<00:55,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9340, LAS: 0.8813, UEM: 0.5833, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2795, partial_loss/deprel_loss: 0.4729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5935, loss: 0.8260, batch_reg_loss: 0.1592, reg_loss: 0.1590 ||:  30%|##9       | 33/111 [00:21<00:52,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9356, LAS: 0.8825, UEM: 0.5790, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3626, partial_loss/deprel_loss: 0.5307, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6563, loss: 0.8157, batch_reg_loss: 0.1593, reg_loss: 0.1590 ||:  33%|###3      | 37/111 [00:24<00:48,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8764, UAS: 0.9346, LAS: 0.8810, UEM: 0.5659, LEM: 0.3250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5879, partial_loss/deprel_loss: 0.6852, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8250, loss: 0.8271, batch_reg_loss: 0.1593, reg_loss: 0.1590 ||:  37%|###6      | 41/111 [00:26<00:44,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9339, LAS: 0.8803, UEM: 0.5605, LEM: 0.3205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6599, loss: 0.8325, batch_reg_loss: 0.1594, reg_loss: 0.1591 ||:  41%|####      | 45/111 [00:29<00:43,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9337, LAS: 0.8795, UEM: 0.5521, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4302, partial_loss/deprel_loss: 0.6363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7545, loss: 0.8381, batch_reg_loss: 0.1595, reg_loss: 0.1591 ||:  44%|####4     | 49/111 [00:32<00:41,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9334, LAS: 0.8794, UEM: 0.5531, LEM: 0.3134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3607, partial_loss/deprel_loss: 0.4791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6150, loss: 0.8376, batch_reg_loss: 0.1595, reg_loss: 0.1591 ||:  47%|####6     | 52/111 [00:34<00:40,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8409, UAS: 0.9332, LAS: 0.8791, UEM: 0.5510, LEM: 0.3121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1740, partial_loss/deprel_loss: 1.0353, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2226, loss: 0.8416, batch_reg_loss: 0.1596, reg_loss: 0.1592 ||:  50%|####9     | 55/111 [00:36<00:38,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9325, LAS: 0.8786, UEM: 0.5527, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2625, partial_loss/deprel_loss: 0.4347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.8446, batch_reg_loss: 0.1596, reg_loss: 0.1592 ||:  53%|#####3    | 59/111 [00:39<00:36,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9332, LAS: 0.8796, UEM: 0.5727, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9880, partial_loss/deprel_loss: 0.8851, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0654, loss: 0.8385, batch_reg_loss: 0.1597, reg_loss: 0.1592 ||:  56%|#####5    | 62/111 [00:41<00:36,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9340, LAS: 0.8803, UEM: 0.5741, LEM: 0.3408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6115, partial_loss/deprel_loss: 0.6343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7895, loss: 0.8323, batch_reg_loss: 0.1598, reg_loss: 0.1592 ||:  59%|#####8    | 65/111 [00:43<00:33,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8495, UAS: 0.9338, LAS: 0.8803, UEM: 0.5767, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1369, partial_loss/deprel_loss: 0.9492, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1465, loss: 0.8330, batch_reg_loss: 0.1598, reg_loss: 0.1593 ||:  62%|######2   | 69/111 [00:46<00:28,  1.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8846, UAS: 0.9338, LAS: 0.8799, UEM: 0.5702, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4896, partial_loss/deprel_loss: 0.6765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7990, loss: 0.8342, batch_reg_loss: 0.1599, reg_loss: 0.1593 ||:  66%|######5   | 73/111 [00:48<00:25,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9336, LAS: 0.8800, UEM: 0.5638, LEM: 0.3331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5143, partial_loss/deprel_loss: 0.6041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7461, loss: 0.8336, batch_reg_loss: 0.1599, reg_loss: 0.1593 ||:  69%|######9   | 77/111 [00:51<00:22,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9337, LAS: 0.8802, UEM: 0.5669, LEM: 0.3362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2365, partial_loss/deprel_loss: 0.4236, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5462, loss: 0.8323, batch_reg_loss: 0.1600, reg_loss: 0.1594 ||:  73%|#######2  | 81/111 [00:53<00:19,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9341, LAS: 0.8807, UEM: 0.5677, LEM: 0.3368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3866, partial_loss/deprel_loss: 0.5101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6455, loss: 0.8288, batch_reg_loss: 0.1601, reg_loss: 0.1594 ||:  77%|#######6  | 85/111 [00:56<00:17,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9332, LAS: 0.8796, UEM: 0.5588, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7277, partial_loss/deprel_loss: 0.6583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8323, loss: 0.8376, batch_reg_loss: 0.1601, reg_loss: 0.1594 ||:  80%|########  | 89/111 [00:58<00:13,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8426, UAS: 0.9322, LAS: 0.8785, UEM: 0.5490, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9825, partial_loss/deprel_loss: 0.9410, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1095, loss: 0.8454, batch_reg_loss: 0.1602, reg_loss: 0.1595 ||:  84%|########3 | 93/111 [01:01<00:11,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9322, LAS: 0.8783, UEM: 0.5471, LEM: 0.3206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1948, partial_loss/deprel_loss: 0.3857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5078, loss: 0.8462, batch_reg_loss: 0.1602, reg_loss: 0.1595 ||:  87%|########7 | 97/111 [01:03<00:08,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9324, LAS: 0.8783, UEM: 0.5435, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6677, partial_loss/deprel_loss: 0.8023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9356, loss: 0.8459, batch_reg_loss: 0.1603, reg_loss: 0.1595 ||:  91%|######### | 101/111 [01:06<00:06,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8043, UAS: 0.9309, LAS: 0.8766, UEM: 0.5376, LEM: 0.3103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7838, partial_loss/deprel_loss: 1.3054, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5615, loss: 0.8610, batch_reg_loss: 0.1604, reg_loss: 0.1596 ||:  95%|#########4| 105/111 [01:09<00:03,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8459, UAS: 0.9305, LAS: 0.8760, UEM: 0.5314, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2171, partial_loss/deprel_loss: 1.0465, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2410, loss: 0.8685, batch_reg_loss: 0.1604, reg_loss: 0.1596 ||:  98%|#########8| 109/111 [01:11<00:01,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8590, UAS: 0.9298, LAS: 0.8752, UEM: 0.5275, LEM: 0.3028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0356, partial_loss/deprel_loss: 0.8129, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0179, loss: 0.8747, batch_reg_loss: 0.1605, reg_loss: 0.1596 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
      "2023-04-06 23:57:59,081 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.813  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.036  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.160  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - UEM                      |     0.528  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - LAS                      |     0.875  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - loss                     |     0.875  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - LEM                      |     0.303  |       N/A\n",
      "2023-04-06 23:57:59,082 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
      "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - EM                       |     0.859  |       N/A\n",
      "2023-04-06 23:57:59,083 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:57:59,083 - INFO - combo.training.trainer - Epoch duration: 0:01:12.545910\n",
      "2023-04-06 23:57:59,083 - INFO - combo.training.trainer - Estimated training time remaining: 7:36:23\n",
      "2023-04-06 23:57:59,083 - INFO - allennlp.training.trainer - Epoch 52/399\n",
      "2023-04-06 23:57:59,084 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:57:59,084 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:57:59,089 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9408, LAS: 0.8872, UEM: 0.4940, LEM: 0.2390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3542, partial_loss/deprel_loss: 0.5430, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6658, loss: 0.7606, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:   3%|2         | 3/111 [00:02<01:12,  1.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9258, LAS: 0.8711, UEM: 0.3767, LEM: 0.1598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6446, partial_loss/deprel_loss: 0.7826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9156, loss: 0.9016, batch_reg_loss: 0.1606, reg_loss: 0.1605 ||:   6%|6         | 7/111 [00:04<01:08,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9247, LAS: 0.8681, UEM: 0.3929, LEM: 0.1730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3376, partial_loss/deprel_loss: 0.5194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6437, loss: 0.9226, batch_reg_loss: 0.1607, reg_loss: 0.1606 ||:  10%|9         | 11/111 [00:06<01:04,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9313, LAS: 0.8752, UEM: 0.4850, LEM: 0.2418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9508, partial_loss/deprel_loss: 0.9080, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0773, loss: 0.8719, batch_reg_loss: 0.1607, reg_loss: 0.1606 ||:  14%|#3        | 15/111 [00:09<01:01,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8230, UAS: 0.9278, LAS: 0.8711, UEM: 0.4450, LEM: 0.2155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4530, partial_loss/deprel_loss: 1.1169, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3450, loss: 0.9087, batch_reg_loss: 0.1608, reg_loss: 0.1607 ||:  17%|#7        | 19/111 [00:11<00:55,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9296, LAS: 0.8736, UEM: 0.4856, LEM: 0.2525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4127, partial_loss/deprel_loss: 0.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6275, loss: 0.8893, batch_reg_loss: 0.1609, reg_loss: 0.1607 ||:  21%|##        | 23/111 [00:13<00:53,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9339, LAS: 0.8787, UEM: 0.5379, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3198, partial_loss/deprel_loss: 0.4749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.8470, batch_reg_loss: 0.1610, reg_loss: 0.1607 ||:  24%|##4       | 27/111 [00:16<00:49,  1.69it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8564, UAS: 0.9342, LAS: 0.8793, UEM: 0.5529, LEM: 0.3165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7539, partial_loss/deprel_loss: 0.8258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9725, loss: 0.8433, batch_reg_loss: 0.1610, reg_loss: 0.1608 ||:  28%|##7       | 31/111 [00:18<00:48,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9329, LAS: 0.8781, UEM: 0.5454, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3077, partial_loss/deprel_loss: 0.5190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6378, loss: 0.8515, batch_reg_loss: 0.1611, reg_loss: 0.1608 ||:  32%|###1      | 35/111 [00:21<00:46,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9309, LAS: 0.8760, UEM: 0.5404, LEM: 0.3105, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7887, partial_loss/deprel_loss: 0.8330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9853, loss: 0.8660, batch_reg_loss: 0.1611, reg_loss: 0.1608 ||:  35%|###5      | 39/111 [00:23<00:43,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8541, UAS: 0.9303, LAS: 0.8754, UEM: 0.5276, LEM: 0.2985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9182, partial_loss/deprel_loss: 0.8559, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0296, loss: 0.8703, batch_reg_loss: 0.1612, reg_loss: 0.1609 ||:  39%|###8      | 43/111 [00:26<00:43,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9305, LAS: 0.8753, UEM: 0.5139, LEM: 0.2856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4979, partial_loss/deprel_loss: 0.6616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7901, loss: 0.8702, batch_reg_loss: 0.1613, reg_loss: 0.1609 ||:  42%|####2     | 47/111 [00:29<00:41,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9313, LAS: 0.8764, UEM: 0.5228, LEM: 0.2900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3390, partial_loss/deprel_loss: 0.5202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6453, loss: 0.8633, batch_reg_loss: 0.1613, reg_loss: 0.1609 ||:  46%|####5     | 51/111 [00:32<00:40,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9325, LAS: 0.8777, UEM: 0.5325, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3731, partial_loss/deprel_loss: 0.5001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6361, loss: 0.8511, batch_reg_loss: 0.1614, reg_loss: 0.1610 ||:  49%|####8     | 54/111 [00:34<00:42,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8530, UAS: 0.9318, LAS: 0.8771, UEM: 0.5251, LEM: 0.2886, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0108, partial_loss/deprel_loss: 0.8002, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0038, loss: 0.8569, batch_reg_loss: 0.1614, reg_loss: 0.1610 ||:  51%|#####1    | 57/111 [00:37<00:39,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8456, UAS: 0.9325, LAS: 0.8778, UEM: 0.5387, LEM: 0.3007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9719, partial_loss/deprel_loss: 0.9103, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0841, loss: 0.8512, batch_reg_loss: 0.1615, reg_loss: 0.1610 ||:  54%|#####4    | 60/111 [00:39<00:36,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9320, LAS: 0.8774, UEM: 0.5422, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4026, partial_loss/deprel_loss: 0.5979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7204, loss: 0.8555, batch_reg_loss: 0.1615, reg_loss: 0.1610 ||:  57%|#####6    | 63/111 [00:41<00:34,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7904, UAS: 0.9314, LAS: 0.8768, UEM: 0.5508, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7467, partial_loss/deprel_loss: 1.1340, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4181, loss: 0.8571, batch_reg_loss: 0.1616, reg_loss: 0.1611 ||:  59%|#####9    | 66/111 [00:43<00:32,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9300, LAS: 0.8752, UEM: 0.5399, LEM: 0.3040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6887, partial_loss/deprel_loss: 0.7504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8997, loss: 0.8692, batch_reg_loss: 0.1616, reg_loss: 0.1611 ||:  63%|######3   | 70/111 [00:45<00:27,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7555, UAS: 0.9286, LAS: 0.8739, UEM: 0.5343, LEM: 0.3004, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.7179, partial_loss/deprel_loss: 1.4741, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8845, loss: 0.8808, batch_reg_loss: 0.1617, reg_loss: 0.1611 ||:  66%|######5   | 73/111 [00:47<00:26,  1.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9288, LAS: 0.8740, UEM: 0.5333, LEM: 0.2995, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5149, partial_loss/deprel_loss: 0.6655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7971, loss: 0.8786, batch_reg_loss: 0.1617, reg_loss: 0.1611 ||:  69%|######9   | 77/111 [00:50<00:22,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8485, UAS: 0.9295, LAS: 0.8748, UEM: 0.5507, LEM: 0.3237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9174, partial_loss/deprel_loss: 0.9188, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0803, loss: 0.8734, batch_reg_loss: 0.1618, reg_loss: 0.1612 ||:  72%|#######2  | 80/111 [00:52<00:22,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9300, LAS: 0.8753, UEM: 0.5510, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5307, partial_loss/deprel_loss: 0.6004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7483, loss: 0.8682, batch_reg_loss: 0.1619, reg_loss: 0.1612 ||:  75%|#######4  | 83/111 [00:54<00:19,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8574, UAS: 0.9305, LAS: 0.8758, UEM: 0.5480, LEM: 0.3195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8368, partial_loss/deprel_loss: 0.9219, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0668, loss: 0.8654, batch_reg_loss: 0.1619, reg_loss: 0.1612 ||:  78%|#######8  | 87/111 [00:57<00:15,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8374, UAS: 0.9295, LAS: 0.8745, UEM: 0.5390, LEM: 0.3128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1307, partial_loss/deprel_loss: 0.9379, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1385, loss: 0.8737, batch_reg_loss: 0.1620, reg_loss: 0.1613 ||:  82%|########1 | 91/111 [00:59<00:12,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9304, LAS: 0.8754, UEM: 0.5423, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5534, partial_loss/deprel_loss: 0.6744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8123, loss: 0.8675, batch_reg_loss: 0.1620, reg_loss: 0.1613 ||:  86%|########5 | 95/111 [01:01<00:10,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9307, LAS: 0.8758, UEM: 0.5385, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4924, partial_loss/deprel_loss: 0.6291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7639, loss: 0.8670, batch_reg_loss: 0.1621, reg_loss: 0.1613 ||:  89%|########9 | 99/111 [01:04<00:07,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9301, LAS: 0.8751, UEM: 0.5371, LEM: 0.3062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8170, partial_loss/deprel_loss: 0.7834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9523, loss: 0.8710, batch_reg_loss: 0.1622, reg_loss: 0.1613 ||:  93%|#########2| 103/111 [01:07<00:05,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8459, UAS: 0.9301, LAS: 0.8751, UEM: 0.5326, LEM: 0.3018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2890, partial_loss/deprel_loss: 0.9941, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2153, loss: 0.8726, batch_reg_loss: 0.1622, reg_loss: 0.1614 ||:  96%|#########6| 107/111 [01:09<00:02,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9304, LAS: 0.8754, UEM: 0.5313, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4115, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7065, loss: 0.8711, batch_reg_loss: 0.1623, reg_loss: 0.1614 ||: 100%|##########| 111/111 [01:12<00:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9304, LAS: 0.8754, UEM: 0.5313, LEM: 0.2993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4115, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7065, loss: 0.8711, batch_reg_loss: 0.1623, reg_loss: 0.1614 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-06 23:59:11,774 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.577  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.412  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.161  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - UEM                      |     0.531  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - LAS                      |     0.875  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - loss                     |     0.871  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - LEM                      |     0.299  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - EM                       |     0.903  |       N/A\n",
      "2023-04-06 23:59:11,775 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-06 23:59:11,776 - INFO - combo.training.trainer - Epoch duration: 0:01:12.692473\n",
      "2023-04-06 23:59:11,776 - INFO - combo.training.trainer - Estimated training time remaining: 7:34:25\n",
      "2023-04-06 23:59:11,776 - INFO - allennlp.training.trainer - Epoch 53/399\n",
      "2023-04-06 23:59:11,776 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-06 23:59:11,776 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-06 23:59:11,782 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9467, LAS: 0.8928, UEM: 0.5404, LEM: 0.2362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5696, partial_loss/deprel_loss: 0.5960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7530, loss: 0.7637, batch_reg_loss: 0.1623, reg_loss: 0.1623 ||:   3%|2         | 3/111 [00:02<01:12,  1.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9464, LAS: 0.8947, UEM: 0.5560, LEM: 0.2780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5968, partial_loss/deprel_loss: 0.5837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7487, loss: 0.7131, batch_reg_loss: 0.1624, reg_loss: 0.1623 ||:   6%|6         | 7/111 [00:04<01:08,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9365, LAS: 0.8817, UEM: 0.4906, LEM: 0.2320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8449, partial_loss/deprel_loss: 0.7423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9252, loss: 0.8082, batch_reg_loss: 0.1625, reg_loss: 0.1624 ||:  10%|9         | 11/111 [00:07<01:05,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9394, LAS: 0.8855, UEM: 0.5849, LEM: 0.3407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2795, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5627, loss: 0.7742, batch_reg_loss: 0.1625, reg_loss: 0.1624 ||:  13%|#2        | 14/111 [00:09<01:06,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9397, LAS: 0.8861, UEM: 0.5769, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3935, partial_loss/deprel_loss: 0.5610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6901, loss: 0.7727, batch_reg_loss: 0.1625, reg_loss: 0.1624 ||:  15%|#5        | 17/111 [00:11<01:04,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8868, UAS: 0.9409, LAS: 0.8868, UEM: 0.5687, LEM: 0.3085, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5827, partial_loss/deprel_loss: 0.6183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7738, loss: 0.7743, batch_reg_loss: 0.1626, reg_loss: 0.1624 ||:  19%|#8        | 21/111 [00:13<00:57,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8515, UAS: 0.9382, LAS: 0.8830, UEM: 0.5330, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7980, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9719, loss: 0.8025, batch_reg_loss: 0.1626, reg_loss: 0.1625 ||:  23%|##2       | 25/111 [00:16<00:54,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8575, UAS: 0.9323, LAS: 0.8767, UEM: 0.5110, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0175, partial_loss/deprel_loss: 0.8682, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0608, loss: 0.8586, batch_reg_loss: 0.1627, reg_loss: 0.1625 ||:  25%|##5       | 28/111 [00:18<00:54,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8408, UAS: 0.9278, LAS: 0.8720, UEM: 0.4900, LEM: 0.2561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1837, partial_loss/deprel_loss: 0.8709, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0962, loss: 0.8946, batch_reg_loss: 0.1627, reg_loss: 0.1625 ||:  28%|##7       | 31/111 [00:20<00:53,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9276, LAS: 0.8718, UEM: 0.4794, LEM: 0.2489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4080, partial_loss/deprel_loss: 0.4971, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6420, loss: 0.8936, batch_reg_loss: 0.1628, reg_loss: 0.1625 ||:  31%|###       | 34/111 [00:22<00:52,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9292, LAS: 0.8736, UEM: 0.4858, LEM: 0.2491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4041, partial_loss/deprel_loss: 0.5663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6967, loss: 0.8827, batch_reg_loss: 0.1628, reg_loss: 0.1626 ||:  34%|###4      | 38/111 [00:25<00:48,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9295, LAS: 0.8742, UEM: 0.4897, LEM: 0.2530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4659, partial_loss/deprel_loss: 0.6584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7828, loss: 0.8813, batch_reg_loss: 0.1629, reg_loss: 0.1626 ||:  38%|###7      | 42/111 [00:27<00:44,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9311, LAS: 0.8761, UEM: 0.5027, LEM: 0.2619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1957, partial_loss/deprel_loss: 0.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5010, loss: 0.8652, batch_reg_loss: 0.1630, reg_loss: 0.1626 ||:  41%|####1     | 46/111 [00:30<00:42,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9320, LAS: 0.8773, UEM: 0.5124, LEM: 0.2717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5651, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7444, loss: 0.8546, batch_reg_loss: 0.1630, reg_loss: 0.1627 ||:  45%|####5     | 50/111 [00:33<00:41,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8246, UAS: 0.9308, LAS: 0.8758, UEM: 0.5093, LEM: 0.2702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1829, partial_loss/deprel_loss: 0.9669, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1732, loss: 0.8625, batch_reg_loss: 0.1631, reg_loss: 0.1627 ||:  48%|####7     | 53/111 [00:35<00:40,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8019, UAS: 0.9278, LAS: 0.8724, UEM: 0.4995, LEM: 0.2647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7117, partial_loss/deprel_loss: 1.1906, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4580, loss: 0.8887, batch_reg_loss: 0.1631, reg_loss: 0.1627 ||:  51%|#####1    | 57/111 [00:37<00:35,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8156, UAS: 0.9276, LAS: 0.8723, UEM: 0.4999, LEM: 0.2658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5744, partial_loss/deprel_loss: 1.0889, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3492, loss: 0.8901, batch_reg_loss: 0.1632, reg_loss: 0.1627 ||:  55%|#####4    | 61/111 [00:39<00:31,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8730, UAS: 0.9285, LAS: 0.8731, UEM: 0.5093, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6473, partial_loss/deprel_loss: 0.7667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9061, loss: 0.8856, batch_reg_loss: 0.1633, reg_loss: 0.1628 ||:  59%|#####8    | 65/111 [00:42<00:29,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9278, LAS: 0.8724, UEM: 0.5045, LEM: 0.2701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4895, partial_loss/deprel_loss: 0.5364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6903, loss: 0.8913, batch_reg_loss: 0.1633, reg_loss: 0.1628 ||:  62%|######2   | 69/111 [00:45<00:27,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8434, UAS: 0.9266, LAS: 0.8711, UEM: 0.4930, LEM: 0.2620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0492, partial_loss/deprel_loss: 1.0301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1973, loss: 0.9030, batch_reg_loss: 0.1634, reg_loss: 0.1628 ||:  66%|######5   | 73/111 [00:47<00:24,  1.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9267, LAS: 0.8713, UEM: 0.4968, LEM: 0.2664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3645, partial_loss/deprel_loss: 0.5718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6938, loss: 0.9019, batch_reg_loss: 0.1635, reg_loss: 0.1629 ||:  69%|######9   | 77/111 [00:50<00:22,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8904, UAS: 0.9279, LAS: 0.8725, UEM: 0.5080, LEM: 0.2731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4258, partial_loss/deprel_loss: 0.5856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7172, loss: 0.8911, batch_reg_loss: 0.1636, reg_loss: 0.1629 ||:  73%|#######2  | 81/111 [00:53<00:21,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9288, LAS: 0.8735, UEM: 0.5127, LEM: 0.2738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4960, partial_loss/deprel_loss: 0.7325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8488, loss: 0.8845, batch_reg_loss: 0.1636, reg_loss: 0.1629 ||:  76%|#######5  | 84/111 [00:55<00:19,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9295, LAS: 0.8742, UEM: 0.5182, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6469, partial_loss/deprel_loss: 0.6858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8417, loss: 0.8779, batch_reg_loss: 0.1637, reg_loss: 0.1630 ||:  78%|#######8  | 87/111 [00:58<00:17,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9290, LAS: 0.8735, UEM: 0.5111, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9573, partial_loss/deprel_loss: 0.9826, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1413, loss: 0.8841, batch_reg_loss: 0.1637, reg_loss: 0.1630 ||:  81%|########1 | 90/111 [01:00<00:14,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9303, LAS: 0.8751, UEM: 0.5402, LEM: 0.3059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2008, partial_loss/deprel_loss: 0.3759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5046, loss: 0.8728, batch_reg_loss: 0.1637, reg_loss: 0.1630 ||:  84%|########3 | 93/111 [01:02<00:13,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8101, UAS: 0.9297, LAS: 0.8744, UEM: 0.5358, LEM: 0.3025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3972, partial_loss/deprel_loss: 1.1130, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3336, loss: 0.8781, batch_reg_loss: 0.1638, reg_loss: 0.1630 ||:  87%|########7 | 97/111 [01:04<00:09,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8339, UAS: 0.9295, LAS: 0.8743, UEM: 0.5347, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3269, partial_loss/deprel_loss: 1.0957, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3058, loss: 0.8800, batch_reg_loss: 0.1638, reg_loss: 0.1631 ||:  90%|######### | 100/111 [01:07<00:07,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9296, LAS: 0.8744, UEM: 0.5320, LEM: 0.2980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3737, partial_loss/deprel_loss: 0.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6197, loss: 0.8794, batch_reg_loss: 0.1639, reg_loss: 0.1631 ||:  94%|#########3| 104/111 [01:09<00:04,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9301, LAS: 0.8749, UEM: 0.5330, LEM: 0.2968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9118, partial_loss/deprel_loss: 0.9566, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1116, loss: 0.8764, batch_reg_loss: 0.1639, reg_loss: 0.1631 ||:  97%|#########7| 108/111 [01:12<00:02,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8401, UAS: 0.9299, LAS: 0.8747, UEM: 0.5328, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0703, partial_loss/deprel_loss: 0.9871, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1677, loss: 0.8771, batch_reg_loss: 0.1640, reg_loss: 0.1631 ||: 100%|##########| 111/111 [01:14<00:00,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8401, UAS: 0.9299, LAS: 0.8747, UEM: 0.5328, LEM: 0.2984, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0703, partial_loss/deprel_loss: 0.9871, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1677, loss: 0.8771, batch_reg_loss: 0.1640, reg_loss: 0.1631 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
      "2023-04-07 00:00:26,510 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.987  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.070  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.163  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - UEM                      |     0.533  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - LAS                      |     0.875  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - loss                     |     0.877  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - LEM                      |     0.298  |       N/A\n",
      "2023-04-07 00:00:26,511 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
      "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - EM                       |     0.840  |       N/A\n",
      "2023-04-07 00:00:26,512 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:00:26,512 - INFO - combo.training.trainer - Epoch duration: 0:01:14.736354\n",
      "2023-04-07 00:00:26,513 - INFO - combo.training.trainer - Estimated training time remaining: 7:32:42\n",
      "2023-04-07 00:00:26,513 - INFO - allennlp.training.trainer - Epoch 54/399\n",
      "2023-04-07 00:00:26,513 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:00:26,513 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:00:26,520 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9448, LAS: 0.8931, UEM: 0.7116, LEM: 0.4577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2033, partial_loss/deprel_loss: 0.3485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4835, loss: 0.7435, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:   3%|2         | 3/111 [00:02<01:14,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9409, LAS: 0.8887, UEM: 0.5927, LEM: 0.3441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3385, partial_loss/deprel_loss: 0.4904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6241, loss: 0.7844, batch_reg_loss: 0.1641, reg_loss: 0.1640 ||:   6%|6         | 7/111 [00:04<01:10,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8577, UAS: 0.9355, LAS: 0.8830, UEM: 0.5229, LEM: 0.2916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8470, partial_loss/deprel_loss: 0.8782, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0361, loss: 0.8226, batch_reg_loss: 0.1641, reg_loss: 0.1641 ||:  10%|9         | 11/111 [00:06<01:05,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9305, LAS: 0.8779, UEM: 0.5623, LEM: 0.3476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1667, partial_loss/deprel_loss: 0.3135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4483, loss: 0.8639, batch_reg_loss: 0.1642, reg_loss: 0.1641 ||:  13%|#2        | 14/111 [00:09<01:07,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8417, UAS: 0.9307, LAS: 0.8791, UEM: 0.6237, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1766, partial_loss/deprel_loss: 0.9353, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1478, loss: 0.8571, batch_reg_loss: 0.1642, reg_loss: 0.1641 ||:  15%|#5        | 17/111 [00:13<01:29,  1.06it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9324, LAS: 0.8798, UEM: 0.5994, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4481, partial_loss/deprel_loss: 0.6010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.8410, batch_reg_loss: 0.1643, reg_loss: 0.1641 ||:  19%|#8        | 21/111 [00:16<01:18,  1.15it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9320, LAS: 0.8789, UEM: 0.5892, LEM: 0.3873, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2499, partial_loss/deprel_loss: 0.4475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5723, loss: 0.8520, batch_reg_loss: 0.1643, reg_loss: 0.1642 ||:  22%|##1       | 24/111 [00:19<01:13,  1.18it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8887, UAS: 0.9321, LAS: 0.8784, UEM: 0.5624, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5136, partial_loss/deprel_loss: 0.6196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7628, loss: 0.8548, batch_reg_loss: 0.1644, reg_loss: 0.1642 ||:  25%|##5       | 28/111 [00:21<01:04,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9341, LAS: 0.8809, UEM: 0.5804, LEM: 0.3688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2605, partial_loss/deprel_loss: 0.3954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5329, loss: 0.8333, batch_reg_loss: 0.1644, reg_loss: 0.1642 ||:  28%|##7       | 31/111 [00:23<01:02,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9328, LAS: 0.8791, UEM: 0.5736, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2956, partial_loss/deprel_loss: 0.4525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5856, loss: 0.8460, batch_reg_loss: 0.1645, reg_loss: 0.1642 ||:  31%|###       | 34/111 [00:26<00:59,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9333, LAS: 0.8795, UEM: 0.5669, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4214, partial_loss/deprel_loss: 0.5140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6600, loss: 0.8440, batch_reg_loss: 0.1645, reg_loss: 0.1643 ||:  33%|###3      | 37/111 [00:28<00:55,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9334, LAS: 0.8801, UEM: 0.5717, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3333, partial_loss/deprel_loss: 0.9017, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1526, loss: 0.8380, batch_reg_loss: 0.1646, reg_loss: 0.1643 ||:  36%|###6      | 40/111 [00:30<00:53,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9321, LAS: 0.8783, UEM: 0.5681, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1812, partial_loss/deprel_loss: 0.8796, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1046, loss: 0.8479, batch_reg_loss: 0.1646, reg_loss: 0.1643 ||:  39%|###8      | 43/111 [00:32<00:50,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9331, LAS: 0.8794, UEM: 0.5662, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8001, partial_loss/deprel_loss: 0.7264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9059, loss: 0.8421, batch_reg_loss: 0.1647, reg_loss: 0.1643 ||:  42%|####2     | 47/111 [00:35<00:45,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9321, LAS: 0.8786, UEM: 0.5562, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3762, partial_loss/deprel_loss: 0.5160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6528, loss: 0.8515, batch_reg_loss: 0.1647, reg_loss: 0.1644 ||:  46%|####5     | 51/111 [00:37<00:40,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9321, LAS: 0.8786, UEM: 0.5521, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2895, partial_loss/deprel_loss: 0.4472, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5805, loss: 0.8509, batch_reg_loss: 0.1648, reg_loss: 0.1644 ||:  49%|####8     | 54/111 [00:39<00:39,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9332, LAS: 0.8799, UEM: 0.5667, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4449, partial_loss/deprel_loss: 0.6679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7881, loss: 0.8421, batch_reg_loss: 0.1648, reg_loss: 0.1644 ||:  51%|#####1    | 57/111 [00:41<00:37,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7900, UAS: 0.9308, LAS: 0.8773, UEM: 0.5544, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8413, partial_loss/deprel_loss: 1.2192, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5085, loss: 0.8640, batch_reg_loss: 0.1649, reg_loss: 0.1644 ||:  55%|#####4    | 61/111 [00:44<00:33,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9321, LAS: 0.8786, UEM: 0.5625, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1444, partial_loss/deprel_loss: 0.3851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5019, loss: 0.8516, batch_reg_loss: 0.1649, reg_loss: 0.1645 ||:  59%|#####8    | 65/111 [00:47<00:31,  1.47it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9318, LAS: 0.8784, UEM: 0.5630, LEM: 0.3356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4898, partial_loss/deprel_loss: 0.6133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7536, loss: 0.8540, batch_reg_loss: 0.1650, reg_loss: 0.1645 ||:  62%|######2   | 69/111 [00:49<00:28,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9320, LAS: 0.8785, UEM: 0.5594, LEM: 0.3298, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3849, partial_loss/deprel_loss: 0.5626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6921, loss: 0.8529, batch_reg_loss: 0.1651, reg_loss: 0.1645 ||:  65%|######4   | 72/111 [00:52<00:26,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8562, UAS: 0.9308, LAS: 0.8771, UEM: 0.5510, LEM: 0.3240, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0675, partial_loss/deprel_loss: 0.8571, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0643, loss: 0.8638, batch_reg_loss: 0.1651, reg_loss: 0.1645 ||:  68%|######7   | 75/111 [00:54<00:24,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8299, UAS: 0.9300, LAS: 0.8759, UEM: 0.5432, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3399, partial_loss/deprel_loss: 0.9877, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2233, loss: 0.8729, batch_reg_loss: 0.1652, reg_loss: 0.1646 ||:  70%|#######   | 78/111 [00:56<00:22,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9305, LAS: 0.8765, UEM: 0.5447, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6205, partial_loss/deprel_loss: 0.7112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8583, loss: 0.8691, batch_reg_loss: 0.1652, reg_loss: 0.1646 ||:  73%|#######2  | 81/111 [00:58<00:21,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9294, LAS: 0.8752, UEM: 0.5381, LEM: 0.3131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5750, partial_loss/deprel_loss: 0.6413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7933, loss: 0.8801, batch_reg_loss: 0.1653, reg_loss: 0.1646 ||:  77%|#######6  | 85/111 [01:00<00:17,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9299, LAS: 0.8759, UEM: 0.5388, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5388, partial_loss/deprel_loss: 0.6564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7982, loss: 0.8754, batch_reg_loss: 0.1653, reg_loss: 0.1646 ||:  79%|#######9  | 88/111 [01:02<00:15,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9307, LAS: 0.8765, UEM: 0.5455, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2060, partial_loss/deprel_loss: 0.3806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5111, loss: 0.8701, batch_reg_loss: 0.1654, reg_loss: 0.1647 ||:  83%|########2 | 92/111 [01:05<00:12,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8516, UAS: 0.9298, LAS: 0.8756, UEM: 0.5412, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0076, partial_loss/deprel_loss: 0.9710, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1438, loss: 0.8782, batch_reg_loss: 0.1655, reg_loss: 0.1647 ||:  86%|########6 | 96/111 [01:08<00:10,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8668, UAS: 0.9303, LAS: 0.8761, UEM: 0.5436, LEM: 0.3130, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7639, partial_loss/deprel_loss: 0.8132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9688, loss: 0.8738, batch_reg_loss: 0.1655, reg_loss: 0.1647 ||:  89%|########9 | 99/111 [01:10<00:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8463, UAS: 0.9296, LAS: 0.8754, UEM: 0.5380, LEM: 0.3088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1287, partial_loss/deprel_loss: 0.9364, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1404, loss: 0.8794, batch_reg_loss: 0.1656, reg_loss: 0.1648 ||:  92%|#########1| 102/111 [01:12<00:06,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9302, LAS: 0.8761, UEM: 0.5385, LEM: 0.3065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2722, partial_loss/deprel_loss: 0.4483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5787, loss: 0.8726, batch_reg_loss: 0.1656, reg_loss: 0.1648 ||:  95%|#########5| 106/111 [01:14<00:03,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8582, UAS: 0.9303, LAS: 0.8761, UEM: 0.5354, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8501, partial_loss/deprel_loss: 0.8843, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0431, loss: 0.8737, batch_reg_loss: 0.1657, reg_loss: 0.1648 ||:  99%|#########9| 110/111 [01:17<00:00,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9302, LAS: 0.8760, UEM: 0.5334, LEM: 0.3015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7965, partial_loss/deprel_loss: 0.7209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9017, loss: 0.8739, batch_reg_loss: 0.1657, reg_loss: 0.1648 ||: 100%|##########| 111/111 [01:17<00:00,  1.42it/s]\n",
      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.721  |       N/A\n",
      "2023-04-07 00:01:44,504 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.797  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.165  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - UEM                      |     0.533  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - LAS                      |     0.876  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - loss                     |     0.874  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - LEM                      |     0.302  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - EM                       |     0.865  |       N/A\n",
      "2023-04-07 00:01:44,505 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:01:44,506 - INFO - combo.training.trainer - Epoch duration: 0:01:17.993194\n",
      "2023-04-07 00:01:44,506 - INFO - combo.training.trainer - Estimated training time remaining: 7:31:20\n",
      "2023-04-07 00:01:44,506 - INFO - allennlp.training.trainer - Epoch 55/399\n",
      "2023-04-07 00:01:44,506 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:01:44,507 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:01:44,513 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8958, UAS: 0.9378, LAS: 0.8843, UEM: 0.6189, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3601, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6997, loss: 0.7860, batch_reg_loss: 0.1657, reg_loss: 0.1657 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8378, UAS: 0.9324, LAS: 0.8764, UEM: 0.4882, LEM: 0.2407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0905, partial_loss/deprel_loss: 1.0808, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2485, loss: 0.8774, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:   6%|6         | 7/111 [00:04<01:12,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8522, UAS: 0.9306, LAS: 0.8749, UEM: 0.4708, LEM: 0.2315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0105, partial_loss/deprel_loss: 0.8525, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0499, loss: 0.8856, batch_reg_loss: 0.1659, reg_loss: 0.1658 ||:  10%|9         | 11/111 [00:07<01:06,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9339, LAS: 0.8782, UEM: 0.5102, LEM: 0.2496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2956, partial_loss/deprel_loss: 0.4273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5669, loss: 0.8600, batch_reg_loss: 0.1659, reg_loss: 0.1658 ||:  14%|#3        | 15/111 [00:09<01:01,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8532, UAS: 0.9279, LAS: 0.8717, UEM: 0.4778, LEM: 0.2334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0383, partial_loss/deprel_loss: 0.8635, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0645, loss: 0.9098, batch_reg_loss: 0.1660, reg_loss: 0.1659 ||:  17%|#7        | 19/111 [00:11<00:58,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8922, UAS: 0.9278, LAS: 0.8715, UEM: 0.4733, LEM: 0.2227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3426, partial_loss/deprel_loss: 0.5423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6684, loss: 0.9059, batch_reg_loss: 0.1661, reg_loss: 0.1659 ||:  21%|##        | 23/111 [00:14<00:55,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9272, LAS: 0.8709, UEM: 0.4712, LEM: 0.2228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2936, partial_loss/deprel_loss: 0.4856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6133, loss: 0.9143, batch_reg_loss: 0.1661, reg_loss: 0.1659 ||:  23%|##3       | 26/111 [00:16<00:55,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9271, LAS: 0.8711, UEM: 0.4586, LEM: 0.2171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7521, partial_loss/deprel_loss: 0.7589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9237, loss: 0.9126, batch_reg_loss: 0.1662, reg_loss: 0.1659 ||:  26%|##6       | 29/111 [00:18<00:57,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9291, LAS: 0.8736, UEM: 0.4894, LEM: 0.2468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4697, partial_loss/deprel_loss: 0.6005, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7406, loss: 0.8919, batch_reg_loss: 0.1662, reg_loss: 0.1660 ||:  29%|##8       | 32/111 [00:21<00:57,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9282, LAS: 0.8727, UEM: 0.5098, LEM: 0.2681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1440, partial_loss/deprel_loss: 0.3799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4990, loss: 0.8966, batch_reg_loss: 0.1663, reg_loss: 0.1660 ||:  32%|###2      | 36/111 [00:24<00:54,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9284, LAS: 0.8732, UEM: 0.5109, LEM: 0.2716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2249, partial_loss/deprel_loss: 0.3740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5105, loss: 0.8943, batch_reg_loss: 0.1664, reg_loss: 0.1660 ||:  36%|###6      | 40/111 [00:26<00:50,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9290, LAS: 0.8739, UEM: 0.5005, LEM: 0.2620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5359, partial_loss/deprel_loss: 0.5986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7525, loss: 0.8865, batch_reg_loss: 0.1664, reg_loss: 0.1661 ||:  40%|###9      | 44/111 [00:29<00:44,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8538, UAS: 0.9300, LAS: 0.8750, UEM: 0.5045, LEM: 0.2663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0223, partial_loss/deprel_loss: 0.9283, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1136, loss: 0.8820, batch_reg_loss: 0.1665, reg_loss: 0.1661 ||:  43%|####3     | 48/111 [00:31<00:41,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9303, LAS: 0.8755, UEM: 0.5021, LEM: 0.2655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7655, partial_loss/deprel_loss: 0.7056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8842, loss: 0.8792, batch_reg_loss: 0.1665, reg_loss: 0.1661 ||:  47%|####6     | 52/111 [00:34<00:40,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9302, LAS: 0.8753, UEM: 0.4943, LEM: 0.2582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5434, partial_loss/deprel_loss: 0.5759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7360, loss: 0.8802, batch_reg_loss: 0.1666, reg_loss: 0.1662 ||:  50%|####9     | 55/111 [00:36<00:38,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9292, LAS: 0.8742, UEM: 0.4979, LEM: 0.2597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3299, partial_loss/deprel_loss: 0.5148, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6445, loss: 0.8854, batch_reg_loss: 0.1666, reg_loss: 0.1662 ||:  52%|#####2    | 58/111 [00:38<00:37,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8848, UAS: 0.9300, LAS: 0.8748, UEM: 0.4960, LEM: 0.2542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5726, partial_loss/deprel_loss: 0.6414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7943, loss: 0.8809, batch_reg_loss: 0.1667, reg_loss: 0.1662 ||:  56%|#####5    | 62/111 [00:41<00:33,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8270, UAS: 0.9287, LAS: 0.8734, UEM: 0.4838, LEM: 0.2459, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3249, partial_loss/deprel_loss: 0.9868, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2212, loss: 0.8900, batch_reg_loss: 0.1668, reg_loss: 0.1662 ||:  59%|#####9    | 66/111 [00:44<00:30,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9292, LAS: 0.8740, UEM: 0.4893, LEM: 0.2502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2609, partial_loss/deprel_loss: 0.4625, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5890, loss: 0.8867, batch_reg_loss: 0.1668, reg_loss: 0.1663 ||:  62%|######2   | 69/111 [00:46<00:29,  1.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9279, LAS: 0.8726, UEM: 0.4918, LEM: 0.2529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2447, partial_loss/deprel_loss: 0.3762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5167, loss: 0.8979, batch_reg_loss: 0.1669, reg_loss: 0.1663 ||:  66%|######5   | 73/111 [00:49<00:26,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9283, LAS: 0.8730, UEM: 0.4954, LEM: 0.2557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4216, partial_loss/deprel_loss: 0.5738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7102, loss: 0.8955, batch_reg_loss: 0.1669, reg_loss: 0.1663 ||:  68%|######8   | 76/111 [00:51<00:24,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9292, LAS: 0.8739, UEM: 0.5096, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1119, partial_loss/deprel_loss: 0.2691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4047, loss: 0.8890, batch_reg_loss: 0.1670, reg_loss: 0.1663 ||:  71%|#######1  | 79/111 [00:53<00:22,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9568, UAS: 0.9288, LAS: 0.8736, UEM: 0.5289, LEM: 0.3012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0828, partial_loss/deprel_loss: 0.1641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3149, loss: 0.8923, batch_reg_loss: 0.1670, reg_loss: 0.1664 ||:  74%|#######3  | 82/111 [00:55<00:21,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8655, UAS: 0.9287, LAS: 0.8735, UEM: 0.5236, LEM: 0.2972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8288, partial_loss/deprel_loss: 0.7915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9661, loss: 0.8928, batch_reg_loss: 0.1671, reg_loss: 0.1664 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9293, LAS: 0.8741, UEM: 0.5222, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2973, partial_loss/deprel_loss: 0.4618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5960, loss: 0.8897, batch_reg_loss: 0.1671, reg_loss: 0.1664 ||:  81%|########1 | 90/111 [01:00<00:14,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9300, LAS: 0.8750, UEM: 0.5309, LEM: 0.3014, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3646, partial_loss/deprel_loss: 0.4656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6126, loss: 0.8813, batch_reg_loss: 0.1672, reg_loss: 0.1665 ||:  84%|########3 | 93/111 [01:02<00:12,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9304, LAS: 0.8754, UEM: 0.5302, LEM: 0.2991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5344, partial_loss/deprel_loss: 0.6124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7641, loss: 0.8764, batch_reg_loss: 0.1672, reg_loss: 0.1665 ||:  86%|########6 | 96/111 [01:05<00:10,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8599, UAS: 0.9304, LAS: 0.8755, UEM: 0.5246, LEM: 0.2934, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9842, partial_loss/deprel_loss: 0.9223, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1020, loss: 0.8779, batch_reg_loss: 0.1673, reg_loss: 0.1665 ||:  90%|######### | 100/111 [01:07<00:07,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9302, LAS: 0.8752, UEM: 0.5250, LEM: 0.2941, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3074, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5382, loss: 0.8795, batch_reg_loss: 0.1673, reg_loss: 0.1665 ||:  93%|#########2| 103/111 [01:09<00:05,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9305, LAS: 0.8756, UEM: 0.5243, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3452, partial_loss/deprel_loss: 0.4917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6297, loss: 0.8772, batch_reg_loss: 0.1673, reg_loss: 0.1666 ||:  96%|#########6| 107/111 [01:12<00:02,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8385, UAS: 0.9307, LAS: 0.8759, UEM: 0.5311, LEM: 0.2999, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0582, partial_loss/deprel_loss: 0.8997, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0988, loss: 0.8732, batch_reg_loss: 0.1674, reg_loss: 0.1666 ||:  99%|#########9| 110/111 [01:14<00:00,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9310, LAS: 0.8761, UEM: 0.5327, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3381, partial_loss/deprel_loss: 0.5684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6897, loss: 0.8716, batch_reg_loss: 0.1674, reg_loss: 0.1666 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-07 00:03:00,154 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9457, LAS: 0.8973, UEM: 0.7127, LEM: 0.5238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2112, partial_loss/deprel_loss: 20.6524, partial_loss/cycle_loss: 0.0000, batch_loss: 16.5642, loss: 23.9662, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.08it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8186, UAS: 0.9355, LAS: 0.8835, UEM: 0.6797, LEM: 0.4542, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6319, partial_loss/deprel_loss: 58.9152, partial_loss/cycle_loss: 0.0000, batch_loss: 47.4585, loss: 28.1342, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:05<00:08,  1.01s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8836, UAS: 0.9338, LAS: 0.8808, UEM: 0.6146, LEM: 0.3880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7457, partial_loss/deprel_loss: 30.3347, partial_loss/cycle_loss: 0.0000, batch_loss: 24.4169, loss: 29.2772, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:07<00:06,  1.01s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9387, LAS: 0.8860, UEM: 0.6328, LEM: 0.3817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5421, partial_loss/deprel_loss: 24.5162, partial_loss/cycle_loss: 0.0000, batch_loss: 19.7214, loss: 27.9239, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:09<00:02,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9427, LAS: 0.8904, UEM: 0.6369, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7084, partial_loss/deprel_loss: 34.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 28.0063, loss: 26.2605, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.07it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9427, LAS: 0.8904, UEM: 0.6369, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7084, partial_loss/deprel_loss: 34.8308, partial_loss/cycle_loss: 0.0000, batch_loss: 28.0063, loss: 26.2605, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.05it/s]\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.568  |    34.831\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.338  |     0.708\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.167  |     0.000\n",
      "2023-04-07 00:03:12,593 - INFO - combo.training.tensorboard_writer - UEM                      |     0.533  |     0.637\n",
      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - LAS                      |     0.876  |     0.890\n",
      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - loss                     |     0.872  |    26.260\n",
      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - LEM                      |     0.300  |     0.368\n",
      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - UAS                      |     0.931  |     0.943\n",
      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - EM                       |     0.901  |     0.886\n",
      "2023-04-07 00:03:12,594 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:03:12,595 - INFO - combo.training.trainer - Epoch duration: 0:01:28.088627\n",
      "2023-04-07 00:03:12,595 - INFO - combo.training.trainer - Estimated training time remaining: 7:31:01\n",
      "2023-04-07 00:03:12,595 - INFO - allennlp.training.trainer - Epoch 56/399\n",
      "2023-04-07 00:03:12,595 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:03:12,595 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:03:12,602 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9052, LAS: 0.8484, UEM: 0.3495, LEM: 0.1702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4177, partial_loss/deprel_loss: 0.5719, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7085, loss: 1.0817, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:   3%|2         | 3/111 [00:02<01:19,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9245, LAS: 0.8711, UEM: 0.3775, LEM: 0.1822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7256, partial_loss/deprel_loss: 0.7942, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9480, loss: 0.9261, batch_reg_loss: 0.1675, reg_loss: 0.1675 ||:   6%|6         | 7/111 [00:04<01:13,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8121, UAS: 0.9251, LAS: 0.8701, UEM: 0.4158, LEM: 0.1978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5426, partial_loss/deprel_loss: 1.1777, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4182, loss: 0.9325, batch_reg_loss: 0.1675, reg_loss: 0.1675 ||:  10%|9         | 11/111 [00:06<01:06,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9213, LAS: 0.8668, UEM: 0.4016, LEM: 0.1869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5635, partial_loss/deprel_loss: 0.6340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7875, loss: 0.9613, batch_reg_loss: 0.1676, reg_loss: 0.1675 ||:  14%|#3        | 15/111 [00:09<01:02,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9253, LAS: 0.8701, UEM: 0.4440, LEM: 0.2079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4793, partial_loss/deprel_loss: 0.6229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7618, loss: 0.9270, batch_reg_loss: 0.1676, reg_loss: 0.1675 ||:  16%|#6        | 18/111 [00:11<01:02,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9262, LAS: 0.8708, UEM: 0.4256, LEM: 0.1955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7134, partial_loss/deprel_loss: 0.7947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9461, loss: 0.9189, batch_reg_loss: 0.1677, reg_loss: 0.1675 ||:  19%|#8        | 21/111 [00:13<01:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9281, LAS: 0.8735, UEM: 0.4891, LEM: 0.2687, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2322, partial_loss/deprel_loss: 0.9139, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1453, loss: 0.8989, batch_reg_loss: 0.1678, reg_loss: 0.1676 ||:  22%|##1       | 24/111 [00:15<00:59,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9323, LAS: 0.8779, UEM: 0.5258, LEM: 0.2887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6955, partial_loss/deprel_loss: 0.6607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8355, loss: 0.8635, batch_reg_loss: 0.1678, reg_loss: 0.1676 ||:  25%|##5       | 28/111 [00:18<00:55,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8774, UAS: 0.9335, LAS: 0.8788, UEM: 0.5304, LEM: 0.2891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6671, partial_loss/deprel_loss: 0.6794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8448, loss: 0.8535, batch_reg_loss: 0.1679, reg_loss: 0.1676 ||:  29%|##8       | 32/111 [00:20<00:51,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8620, UAS: 0.9307, LAS: 0.8755, UEM: 0.5065, LEM: 0.2739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8566, partial_loss/deprel_loss: 0.7906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9718, loss: 0.8817, batch_reg_loss: 0.1679, reg_loss: 0.1677 ||:  32%|###2      | 36/111 [00:23<00:47,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8542, UAS: 0.9307, LAS: 0.8759, UEM: 0.5141, LEM: 0.2816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8571, partial_loss/deprel_loss: 0.7935, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9742, loss: 0.8756, batch_reg_loss: 0.1680, reg_loss: 0.1677 ||:  36%|###6      | 40/111 [00:26<00:47,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9301, LAS: 0.8756, UEM: 0.5189, LEM: 0.2918, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9675, partial_loss/deprel_loss: 0.9376, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1116, loss: 0.8777, batch_reg_loss: 0.1681, reg_loss: 0.1677 ||:  40%|###9      | 44/111 [00:28<00:43,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9300, LAS: 0.8757, UEM: 0.5087, LEM: 0.2809, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5739, partial_loss/deprel_loss: 0.5392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7143, loss: 0.8775, batch_reg_loss: 0.1681, reg_loss: 0.1678 ||:  43%|####3     | 48/111 [00:31<00:40,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9298, LAS: 0.8754, UEM: 0.5231, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3955, partial_loss/deprel_loss: 0.6056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7318, loss: 0.8786, batch_reg_loss: 0.1682, reg_loss: 0.1678 ||:  47%|####6     | 52/111 [00:33<00:38,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9317, LAS: 0.8777, UEM: 0.5608, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3015, partial_loss/deprel_loss: 0.4829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6149, loss: 0.8624, batch_reg_loss: 0.1683, reg_loss: 0.1678 ||:  50%|#####     | 56/111 [00:36<00:35,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8687, UAS: 0.9320, LAS: 0.8779, UEM: 0.5538, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7732, partial_loss/deprel_loss: 0.8248, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9828, loss: 0.8628, batch_reg_loss: 0.1683, reg_loss: 0.1679 ||:  54%|#####4    | 60/111 [00:38<00:32,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9315, LAS: 0.8774, UEM: 0.5514, LEM: 0.3265, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2844, partial_loss/deprel_loss: 0.4435, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5800, loss: 0.8651, batch_reg_loss: 0.1684, reg_loss: 0.1679 ||:  58%|#####7    | 64/111 [00:41<00:31,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8592, UAS: 0.9296, LAS: 0.8752, UEM: 0.5375, LEM: 0.3173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8510, partial_loss/deprel_loss: 0.7962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9756, loss: 0.8823, batch_reg_loss: 0.1684, reg_loss: 0.1679 ||:  61%|######1   | 68/111 [00:44<00:28,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8740, UAS: 0.9303, LAS: 0.8758, UEM: 0.5345, LEM: 0.3132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6570, partial_loss/deprel_loss: 0.7377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8901, loss: 0.8786, batch_reg_loss: 0.1685, reg_loss: 0.1679 ||:  65%|######4   | 72/111 [00:46<00:25,  1.53it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9287, LAS: 0.8742, UEM: 0.5252, LEM: 0.3058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5470, partial_loss/deprel_loss: 0.9589, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2450, loss: 0.8900, batch_reg_loss: 0.1686, reg_loss: 0.1680 ||:  68%|######8   | 76/111 [00:49<00:22,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8437, UAS: 0.9281, LAS: 0.8733, UEM: 0.5200, LEM: 0.3022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0865, partial_loss/deprel_loss: 0.9616, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1552, loss: 0.8975, batch_reg_loss: 0.1686, reg_loss: 0.1680 ||:  72%|#######2  | 80/111 [00:51<00:19,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9276, LAS: 0.8728, UEM: 0.5178, LEM: 0.3011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2355, partial_loss/deprel_loss: 0.3739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5149, loss: 0.9017, batch_reg_loss: 0.1687, reg_loss: 0.1680 ||:  76%|#######5  | 84/111 [00:54<00:17,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9287, LAS: 0.8741, UEM: 0.5313, LEM: 0.3112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9235, partial_loss/deprel_loss: 0.8001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9935, loss: 0.8910, batch_reg_loss: 0.1688, reg_loss: 0.1681 ||:  79%|#######9  | 88/111 [00:57<00:15,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9295, LAS: 0.8749, UEM: 0.5379, LEM: 0.3145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2532, partial_loss/deprel_loss: 0.3850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5275, loss: 0.8835, batch_reg_loss: 0.1688, reg_loss: 0.1681 ||:  82%|########1 | 91/111 [00:59<00:13,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8366, UAS: 0.9292, LAS: 0.8745, UEM: 0.5322, LEM: 0.3098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2230, partial_loss/deprel_loss: 1.0392, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2448, loss: 0.8888, batch_reg_loss: 0.1689, reg_loss: 0.1681 ||:  85%|########4 | 94/111 [01:01<00:11,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8414, UAS: 0.9293, LAS: 0.8746, UEM: 0.5293, LEM: 0.3064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1261, partial_loss/deprel_loss: 0.9523, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1560, loss: 0.8880, batch_reg_loss: 0.1689, reg_loss: 0.1681 ||:  87%|########7 | 97/111 [01:04<00:10,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9299, LAS: 0.8754, UEM: 0.5300, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3975, partial_loss/deprel_loss: 0.5280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6709, loss: 0.8825, batch_reg_loss: 0.1690, reg_loss: 0.1682 ||:  91%|######### | 101/111 [01:06<00:06,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9300, LAS: 0.8756, UEM: 0.5286, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4520, partial_loss/deprel_loss: 0.5662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7124, loss: 0.8817, batch_reg_loss: 0.1690, reg_loss: 0.1682 ||:  94%|#########3| 104/111 [01:08<00:04,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9309, LAS: 0.8767, UEM: 0.5328, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3614, partial_loss/deprel_loss: 0.5570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6869, loss: 0.8740, batch_reg_loss: 0.1691, reg_loss: 0.1682 ||:  97%|#########7| 108/111 [01:11<00:02,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9313, LAS: 0.8771, UEM: 0.5337, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3501, partial_loss/deprel_loss: 0.5126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6492, loss: 0.8706, batch_reg_loss: 0.1691, reg_loss: 0.1683 ||: 100%|##########| 111/111 [01:14<00:00,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9313, LAS: 0.8771, UEM: 0.5337, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3501, partial_loss/deprel_loss: 0.5126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6492, loss: 0.8706, batch_reg_loss: 0.1691, reg_loss: 0.1683 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.513  |       N/A\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.350  |       N/A\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.168  |       N/A\n",
      "2023-04-07 00:04:26,673 - INFO - combo.training.tensorboard_writer - UEM                      |     0.534  |       N/A\n",
      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - LAS                      |     0.877  |       N/A\n",
      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - loss                     |     0.871  |       N/A\n",
      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - LEM                      |     0.305  |       N/A\n",
      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - UAS                      |     0.931  |       N/A\n",
      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - EM                       |     0.904  |       N/A\n",
      "2023-04-07 00:04:26,674 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:04:26,675 - INFO - combo.training.trainer - Epoch duration: 0:01:14.079801\n",
      "2023-04-07 00:04:26,675 - INFO - combo.training.trainer - Estimated training time remaining: 7:29:14\n",
      "2023-04-07 00:04:26,675 - INFO - allennlp.training.trainer - Epoch 57/399\n",
      "2023-04-07 00:04:26,675 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:04:26,675 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:04:26,683 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9574, LAS: 0.9082, UEM: 0.6799, LEM: 0.3935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2009, partial_loss/deprel_loss: 0.3836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5162, loss: 0.6548, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:   3%|2         | 3/111 [00:02<01:22,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9448, LAS: 0.8923, UEM: 0.5579, LEM: 0.2907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8817, partial_loss/deprel_loss: 0.7887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9765, loss: 0.7685, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||:   5%|5         | 6/111 [00:04<01:21,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9418, LAS: 0.8873, UEM: 0.5336, LEM: 0.2565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4015, partial_loss/deprel_loss: 0.5489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6886, loss: 0.8019, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||:   8%|8         | 9/111 [00:06<01:15,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9361, LAS: 0.8815, UEM: 0.5493, LEM: 0.2631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2932, partial_loss/deprel_loss: 0.4796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6116, loss: 0.8263, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||:  11%|#         | 12/111 [00:08<01:13,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9336, LAS: 0.8793, UEM: 0.5382, LEM: 0.2618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5175, partial_loss/deprel_loss: 0.6198, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7686, loss: 0.8427, batch_reg_loss: 0.1693, reg_loss: 0.1692 ||:  14%|#3        | 15/111 [00:10<01:09,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9344, LAS: 0.8807, UEM: 0.5316, LEM: 0.2545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3015, partial_loss/deprel_loss: 0.4974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6276, loss: 0.8396, batch_reg_loss: 0.1693, reg_loss: 0.1692 ||:  16%|#6        | 18/111 [00:13<01:06,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9383, LAS: 0.8858, UEM: 0.5676, LEM: 0.2897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2669, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.8026, batch_reg_loss: 0.1694, reg_loss: 0.1692 ||:  20%|#9        | 22/111 [00:15<01:03,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9375, LAS: 0.8848, UEM: 0.5659, LEM: 0.2910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4388, partial_loss/deprel_loss: 0.5643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7086, loss: 0.8037, batch_reg_loss: 0.1694, reg_loss: 0.1693 ||:  23%|##2       | 25/111 [00:17<01:01,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9375, LAS: 0.8849, UEM: 0.5632, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9904, partial_loss/deprel_loss: 0.8711, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0644, loss: 0.8074, batch_reg_loss: 0.1695, reg_loss: 0.1693 ||:  25%|##5       | 28/111 [00:20<01:00,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9383, LAS: 0.8857, UEM: 0.5685, LEM: 0.2989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2511, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5460, loss: 0.7991, batch_reg_loss: 0.1695, reg_loss: 0.1693 ||:  28%|##7       | 31/111 [00:22<00:59,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9386, LAS: 0.8856, UEM: 0.5538, LEM: 0.2834, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6780, partial_loss/deprel_loss: 0.7338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8922, loss: 0.8009, batch_reg_loss: 0.1695, reg_loss: 0.1693 ||:  32%|###1      | 35/111 [00:24<00:53,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9393, LAS: 0.8863, UEM: 0.5712, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1683, partial_loss/deprel_loss: 0.3453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4795, loss: 0.7953, batch_reg_loss: 0.1696, reg_loss: 0.1693 ||:  34%|###4      | 38/111 [00:27<00:50,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8656, UAS: 0.9381, LAS: 0.8853, UEM: 0.5535, LEM: 0.2932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8753, partial_loss/deprel_loss: 0.8562, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0296, loss: 0.8056, batch_reg_loss: 0.1696, reg_loss: 0.1694 ||:  38%|###7      | 42/111 [00:29<00:45,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9391, LAS: 0.8863, UEM: 0.5589, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2931, partial_loss/deprel_loss: 0.4550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5923, loss: 0.7981, batch_reg_loss: 0.1697, reg_loss: 0.1694 ||:  41%|####1     | 46/111 [00:32<00:45,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9383, LAS: 0.8852, UEM: 0.5596, LEM: 0.2990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2342, partial_loss/deprel_loss: 0.9472, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1743, loss: 0.8052, batch_reg_loss: 0.1697, reg_loss: 0.1694 ||:  44%|####4     | 49/111 [00:34<00:43,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9382, LAS: 0.8851, UEM: 0.5530, LEM: 0.2922, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4239, partial_loss/deprel_loss: 0.4945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6501, loss: 0.8059, batch_reg_loss: 0.1698, reg_loss: 0.1694 ||:  47%|####6     | 52/111 [00:36<00:41,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9379, LAS: 0.8845, UEM: 0.5488, LEM: 0.2867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3379, partial_loss/deprel_loss: 0.5204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6537, loss: 0.8090, batch_reg_loss: 0.1698, reg_loss: 0.1695 ||:  50%|#####     | 56/111 [00:39<00:37,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9379, LAS: 0.8848, UEM: 0.5595, LEM: 0.3004, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2587, partial_loss/deprel_loss: 0.9625, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1916, loss: 0.8063, batch_reg_loss: 0.1699, reg_loss: 0.1695 ||:  53%|#####3    | 59/111 [00:41<00:35,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9372, LAS: 0.8841, UEM: 0.5497, LEM: 0.2937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8368, partial_loss/deprel_loss: 0.7492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9366, loss: 0.8141, batch_reg_loss: 0.1699, reg_loss: 0.1695 ||:  56%|#####5    | 62/111 [00:43<00:35,  1.40it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9372, LAS: 0.8840, UEM: 0.5502, LEM: 0.2970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2499, partial_loss/deprel_loss: 0.3824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5258, loss: 0.8138, batch_reg_loss: 0.1699, reg_loss: 0.1695 ||:  59%|#####8    | 65/111 [00:46<00:33,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9362, LAS: 0.8828, UEM: 0.5413, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8034, partial_loss/deprel_loss: 0.7748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9505, loss: 0.8236, batch_reg_loss: 0.1700, reg_loss: 0.1695 ||:  61%|######1   | 68/111 [00:48<00:30,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9134, UAS: 0.9372, LAS: 0.8837, UEM: 0.5485, LEM: 0.2933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2735, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5999, loss: 0.8154, batch_reg_loss: 0.1700, reg_loss: 0.1696 ||:  65%|######4   | 72/111 [00:50<00:27,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8537, UAS: 0.9369, LAS: 0.8832, UEM: 0.5447, LEM: 0.2896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8168, partial_loss/deprel_loss: 0.7835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9603, loss: 0.8159, batch_reg_loss: 0.1701, reg_loss: 0.1696 ||:  68%|######8   | 76/111 [00:53<00:23,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9351, LAS: 0.8814, UEM: 0.5352, LEM: 0.2840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8657, partial_loss/deprel_loss: 0.9087, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0703, loss: 0.8321, batch_reg_loss: 0.1702, reg_loss: 0.1696 ||:  72%|#######2  | 80/111 [00:55<00:20,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8396, UAS: 0.9344, LAS: 0.8804, UEM: 0.5286, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3138, partial_loss/deprel_loss: 0.9856, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2214, loss: 0.8418, batch_reg_loss: 0.1702, reg_loss: 0.1696 ||:  76%|#######5  | 84/111 [00:58<00:17,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7678, UAS: 0.9332, LAS: 0.8793, UEM: 0.5226, LEM: 0.2739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.4154, partial_loss/deprel_loss: 1.4659, partial_loss/cycle_loss: 0.0000, batch_loss: 1.8261, loss: 0.8530, batch_reg_loss: 0.1703, reg_loss: 0.1697 ||:  79%|#######9  | 88/111 [01:00<00:15,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8031, UAS: 0.9315, LAS: 0.8773, UEM: 0.5138, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6813, partial_loss/deprel_loss: 1.2116, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4759, loss: 0.8697, batch_reg_loss: 0.1704, reg_loss: 0.1697 ||:  83%|########2 | 92/111 [01:03<00:12,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8146, UAS: 0.9307, LAS: 0.8762, UEM: 0.5060, LEM: 0.2642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5085, partial_loss/deprel_loss: 1.0874, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3421, loss: 0.8791, batch_reg_loss: 0.1704, reg_loss: 0.1697 ||:  86%|########6 | 96/111 [01:06<00:10,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8565, UAS: 0.9313, LAS: 0.8770, UEM: 0.5214, LEM: 0.2812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8799, partial_loss/deprel_loss: 0.7930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9809, loss: 0.8718, batch_reg_loss: 0.1705, reg_loss: 0.1698 ||:  89%|########9 | 99/111 [01:08<00:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8170, UAS: 0.9314, LAS: 0.8773, UEM: 0.5363, LEM: 0.3029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5947, partial_loss/deprel_loss: 1.1252, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3897, loss: 0.8706, batch_reg_loss: 0.1705, reg_loss: 0.1698 ||:  92%|#########1| 102/111 [01:10<00:06,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9312, LAS: 0.8771, UEM: 0.5340, LEM: 0.3009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3184, partial_loss/deprel_loss: 0.5107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6428, loss: 0.8734, batch_reg_loss: 0.1706, reg_loss: 0.1698 ||:  95%|#########4| 105/111 [01:12<00:04,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9314, LAS: 0.8773, UEM: 0.5357, LEM: 0.3026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1379, partial_loss/deprel_loss: 0.4026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.8727, batch_reg_loss: 0.1707, reg_loss: 0.1698 ||:  98%|#########8| 109/111 [01:15<00:01,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8319, UAS: 0.9312, LAS: 0.8771, UEM: 0.5351, LEM: 0.3020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3903, partial_loss/deprel_loss: 1.0609, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2975, loss: 0.8749, batch_reg_loss: 0.1707, reg_loss: 0.1698 ||: 100%|##########| 111/111 [01:16<00:00,  1.44it/s]\n",
      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:05:43,646 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.061  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.390  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.170  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - UEM                      |     0.535  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - LAS                      |     0.877  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - loss                     |     0.875  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - LEM                      |     0.302  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - UAS                      |     0.931  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - EM                       |     0.832  |       N/A\n",
      "2023-04-07 00:05:43,647 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:05:43,648 - INFO - combo.training.trainer - Epoch duration: 0:01:16.973170\n",
      "2023-04-07 00:05:43,648 - INFO - combo.training.trainer - Estimated training time remaining: 7:27:46\n",
      "2023-04-07 00:05:43,648 - INFO - allennlp.training.trainer - Epoch 58/399\n",
      "2023-04-07 00:05:43,649 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:05:43,649 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:05:43,656 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9596, UAS: 0.9595, LAS: 0.9153, UEM: 0.8286, LEM: 0.6638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0595, partial_loss/deprel_loss: 0.1632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3132, loss: 0.6007, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:   3%|2         | 3/111 [00:02<01:31,  1.17it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9561, LAS: 0.9084, UEM: 0.7561, LEM: 0.5438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3785, partial_loss/deprel_loss: 0.5578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.6717, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:   5%|5         | 6/111 [00:04<01:24,  1.24it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8974, UAS: 0.9398, LAS: 0.8906, UEM: 0.6781, LEM: 0.4762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4555, partial_loss/deprel_loss: 0.6072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7477, loss: 0.8015, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:   8%|8         | 9/111 [00:06<01:19,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9390, LAS: 0.8898, UEM: 0.6879, LEM: 0.4847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1247, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4267, loss: 0.7959, batch_reg_loss: 0.1709, reg_loss: 0.1708 ||:  11%|#         | 12/111 [00:09<01:16,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9394, LAS: 0.8893, UEM: 0.6638, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4382, partial_loss/deprel_loss: 0.5194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6741, loss: 0.7959, batch_reg_loss: 0.1709, reg_loss: 0.1708 ||:  14%|#3        | 15/111 [00:11<01:13,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9375, LAS: 0.8866, UEM: 0.6227, LEM: 0.4106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4958, partial_loss/deprel_loss: 0.5977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7483, loss: 0.8116, batch_reg_loss: 0.1710, reg_loss: 0.1708 ||:  16%|#6        | 18/111 [00:13<01:09,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9390, LAS: 0.8878, UEM: 0.6204, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3002, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6721, loss: 0.7963, batch_reg_loss: 0.1710, reg_loss: 0.1709 ||:  19%|#8        | 21/111 [00:15<01:06,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8683, UAS: 0.9392, LAS: 0.8883, UEM: 0.6134, LEM: 0.3908, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7934, partial_loss/deprel_loss: 0.7961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9666, loss: 0.7907, batch_reg_loss: 0.1711, reg_loss: 0.1709 ||:  22%|##1       | 24/111 [00:17<01:03,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9363, LAS: 0.8847, UEM: 0.5900, LEM: 0.3708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5115, partial_loss/deprel_loss: 0.6097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7612, loss: 0.8143, batch_reg_loss: 0.1711, reg_loss: 0.1709 ||:  24%|##4       | 27/111 [00:19<01:01,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8642, UAS: 0.9362, LAS: 0.8844, UEM: 0.5729, LEM: 0.3494, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9451, partial_loss/deprel_loss: 0.7701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9762, loss: 0.8149, batch_reg_loss: 0.1712, reg_loss: 0.1709 ||:  28%|##7       | 31/111 [00:22<00:55,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9355, LAS: 0.8831, UEM: 0.5606, LEM: 0.3357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8069, partial_loss/deprel_loss: 0.7371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9223, loss: 0.8263, batch_reg_loss: 0.1712, reg_loss: 0.1710 ||:  31%|###       | 34/111 [00:24<00:52,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8912, UAS: 0.9365, LAS: 0.8844, UEM: 0.5572, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5529, partial_loss/deprel_loss: 0.6048, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7657, loss: 0.8172, batch_reg_loss: 0.1712, reg_loss: 0.1710 ||:  33%|###3      | 37/111 [00:26<00:50,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8538, UAS: 0.9357, LAS: 0.8834, UEM: 0.5464, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0253, partial_loss/deprel_loss: 0.8089, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0234, loss: 0.8234, batch_reg_loss: 0.1713, reg_loss: 0.1710 ||:  37%|###6      | 41/111 [00:29<00:47,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9355, LAS: 0.8831, UEM: 0.5659, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2456, partial_loss/deprel_loss: 0.4127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5506, loss: 0.8257, batch_reg_loss: 0.1713, reg_loss: 0.1710 ||:  40%|###9      | 44/111 [00:31<00:46,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8660, UAS: 0.9308, LAS: 0.8782, UEM: 0.5494, LEM: 0.3243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9662, partial_loss/deprel_loss: 0.8248, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0244, loss: 0.8680, batch_reg_loss: 0.1714, reg_loss: 0.1711 ||:  43%|####3     | 48/111 [00:33<00:42,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9301, LAS: 0.8776, UEM: 0.5468, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3291, partial_loss/deprel_loss: 0.4619, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6068, loss: 0.8733, batch_reg_loss: 0.1714, reg_loss: 0.1711 ||:  46%|####5     | 51/111 [00:36<00:42,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9141, UAS: 0.9301, LAS: 0.8774, UEM: 0.5459, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2580, partial_loss/deprel_loss: 0.4262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5641, loss: 0.8732, batch_reg_loss: 0.1715, reg_loss: 0.1711 ||:  49%|####8     | 54/111 [00:38<00:39,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8443, UAS: 0.9303, LAS: 0.8775, UEM: 0.5463, LEM: 0.3237, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9609, partial_loss/deprel_loss: 0.8621, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0534, loss: 0.8687, batch_reg_loss: 0.1716, reg_loss: 0.1711 ||:  51%|#####1    | 57/111 [00:40<00:38,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8988, UAS: 0.9323, LAS: 0.8796, UEM: 0.5627, LEM: 0.3346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4283, partial_loss/deprel_loss: 0.5501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6973, loss: 0.8529, batch_reg_loss: 0.1716, reg_loss: 0.1712 ||:  55%|#####4    | 61/111 [00:42<00:34,  1.44it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8381, UAS: 0.9310, LAS: 0.8782, UEM: 0.5520, LEM: 0.3267, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1179, partial_loss/deprel_loss: 0.8586, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0821, loss: 0.8627, batch_reg_loss: 0.1717, reg_loss: 0.1712 ||:  59%|#####8    | 65/111 [00:45<00:31,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9320, LAS: 0.8792, UEM: 0.5555, LEM: 0.3268, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5933, partial_loss/deprel_loss: 0.6654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8227, loss: 0.8550, batch_reg_loss: 0.1717, reg_loss: 0.1712 ||:  61%|######1   | 68/111 [00:47<00:29,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9326, LAS: 0.8796, UEM: 0.5645, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1658, partial_loss/deprel_loss: 0.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5465, loss: 0.8516, batch_reg_loss: 0.1718, reg_loss: 0.1712 ||:  64%|######3   | 71/111 [00:49<00:28,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8692, UAS: 0.9329, LAS: 0.8797, UEM: 0.5560, LEM: 0.3247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6251, partial_loss/deprel_loss: 0.7558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9015, loss: 0.8517, batch_reg_loss: 0.1718, reg_loss: 0.1713 ||:  68%|######7   | 75/111 [00:52<00:23,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8435, UAS: 0.9324, LAS: 0.8787, UEM: 0.5451, LEM: 0.3162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0988, partial_loss/deprel_loss: 0.9087, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1186, loss: 0.8610, batch_reg_loss: 0.1719, reg_loss: 0.1713 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9328, LAS: 0.8791, UEM: 0.5434, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3353, partial_loss/deprel_loss: 0.5287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6619, loss: 0.8598, batch_reg_loss: 0.1719, reg_loss: 0.1713 ||:  74%|#######3  | 82/111 [00:57<00:19,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9323, LAS: 0.8787, UEM: 0.5416, LEM: 0.3104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7752, partial_loss/deprel_loss: 0.7615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9362, loss: 0.8612, batch_reg_loss: 0.1719, reg_loss: 0.1713 ||:  77%|#######6  | 85/111 [00:59<00:18,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9317, LAS: 0.8779, UEM: 0.5354, LEM: 0.3063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5456, partial_loss/deprel_loss: 0.5851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7492, loss: 0.8666, batch_reg_loss: 0.1720, reg_loss: 0.1714 ||:  79%|#######9  | 88/111 [01:01<00:15,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9319, LAS: 0.8783, UEM: 0.5453, LEM: 0.3187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1393, partial_loss/deprel_loss: 0.2585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4067, loss: 0.8646, batch_reg_loss: 0.1720, reg_loss: 0.1714 ||:  83%|########2 | 92/111 [01:04<00:13,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8494, UAS: 0.9318, LAS: 0.8782, UEM: 0.5385, LEM: 0.3119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9511, partial_loss/deprel_loss: 0.9121, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0920, loss: 0.8661, batch_reg_loss: 0.1721, reg_loss: 0.1714 ||:  86%|########6 | 96/111 [01:06<00:10,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8852, UAS: 0.9316, LAS: 0.8780, UEM: 0.5317, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6062, partial_loss/deprel_loss: 0.6751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8335, loss: 0.8693, batch_reg_loss: 0.1722, reg_loss: 0.1714 ||:  90%|######### | 100/111 [01:09<00:07,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9321, LAS: 0.8787, UEM: 0.5358, LEM: 0.3087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2498, partial_loss/deprel_loss: 0.3508, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5029, loss: 0.8622, batch_reg_loss: 0.1722, reg_loss: 0.1715 ||:  94%|#########3| 104/111 [01:11<00:04,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9325, LAS: 0.8791, UEM: 0.5368, LEM: 0.3090, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6178, partial_loss/deprel_loss: 0.7346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8835, loss: 0.8581, batch_reg_loss: 0.1723, reg_loss: 0.1715 ||:  96%|#########6| 107/111 [01:13<00:02,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9318, LAS: 0.8783, UEM: 0.5331, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2776, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5764, loss: 0.8651, batch_reg_loss: 0.1723, reg_loss: 0.1715 ||: 100%|##########| 111/111 [01:16<00:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9318, LAS: 0.8783, UEM: 0.5331, LEM: 0.3068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2776, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5764, loss: 0.8651, batch_reg_loss: 0.1723, reg_loss: 0.1715 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-07 00:07:00,259 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:07:00,259 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:07:00,259 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.436  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.278  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - UEM                      |     0.533  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - LAS                      |     0.878  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - loss                     |     0.865  |       N/A\n",
      "2023-04-07 00:07:00,260 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - LEM                      |     0.307  |       N/A\n",
      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - UAS                      |     0.932  |       N/A\n",
      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - EM                       |     0.913  |       N/A\n",
      "2023-04-07 00:07:00,261 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:07:00,262 - INFO - combo.training.trainer - Epoch duration: 0:01:16.613383\n",
      "2023-04-07 00:07:00,262 - INFO - combo.training.trainer - Estimated training time remaining: 7:26:16\n",
      "2023-04-07 00:07:00,262 - INFO - allennlp.training.trainer - Epoch 59/399\n",
      "2023-04-07 00:07:00,262 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:07:00,263 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:07:00,270 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8762, UAS: 0.9336, LAS: 0.8775, UEM: 0.3808, LEM: 0.1360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7637, partial_loss/deprel_loss: 0.6570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8507, loss: 0.8668, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:   4%|3         | 4/111 [00:02<01:07,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9333, LAS: 0.8780, UEM: 0.5207, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2748, partial_loss/deprel_loss: 0.4359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5761, loss: 0.8606, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:   6%|6         | 7/111 [00:04<01:08,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8552, UAS: 0.9347, LAS: 0.8794, UEM: 0.4916, LEM: 0.2364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9107, partial_loss/deprel_loss: 0.8228, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0128, loss: 0.8498, batch_reg_loss: 0.1725, reg_loss: 0.1724 ||:   9%|9         | 10/111 [00:06<01:07,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8452, UAS: 0.9266, LAS: 0.8729, UEM: 0.4409, LEM: 0.2103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3004, partial_loss/deprel_loss: 0.9704, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2089, loss: 0.8981, batch_reg_loss: 0.1725, reg_loss: 0.1724 ||:  12%|#1        | 13/111 [00:08<01:05,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9335, LAS: 0.8811, UEM: 0.5484, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1577, partial_loss/deprel_loss: 0.3573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4900, loss: 0.8355, batch_reg_loss: 0.1726, reg_loss: 0.1725 ||:  14%|#4        | 16/111 [00:11<01:06,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8034, UAS: 0.9277, LAS: 0.8738, UEM: 0.4982, LEM: 0.2656, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9376, partial_loss/deprel_loss: 1.0868, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4295, loss: 0.8938, batch_reg_loss: 0.1726, reg_loss: 0.1725 ||:  18%|#8        | 20/111 [00:13<01:00,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9292, LAS: 0.8751, UEM: 0.5387, LEM: 0.3178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1075, partial_loss/deprel_loss: 0.2709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4109, loss: 0.8872, batch_reg_loss: 0.1727, reg_loss: 0.1725 ||:  21%|##        | 23/111 [00:15<00:59,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9307, LAS: 0.8770, UEM: 0.5338, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3092, partial_loss/deprel_loss: 0.4545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5981, loss: 0.8721, batch_reg_loss: 0.1727, reg_loss: 0.1725 ||:  23%|##3       | 26/111 [00:18<01:01,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8828, UAS: 0.9296, LAS: 0.8759, UEM: 0.5318, LEM: 0.3076, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5820, partial_loss/deprel_loss: 0.6105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7775, loss: 0.8817, batch_reg_loss: 0.1728, reg_loss: 0.1726 ||:  26%|##6       | 29/111 [00:20<00:58,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9292, LAS: 0.8753, UEM: 0.5118, LEM: 0.2923, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8447, partial_loss/deprel_loss: 0.8250, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0018, loss: 0.8869, batch_reg_loss: 0.1728, reg_loss: 0.1726 ||:  29%|##8       | 32/111 [00:22<00:55,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9321, LAS: 0.8791, UEM: 0.5550, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2176, partial_loss/deprel_loss: 0.3670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5100, loss: 0.8576, batch_reg_loss: 0.1728, reg_loss: 0.1726 ||:  32%|###1      | 35/111 [00:24<00:54,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9342, LAS: 0.8816, UEM: 0.5933, LEM: 0.3763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0539, partial_loss/deprel_loss: 0.1786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3265, loss: 0.8401, batch_reg_loss: 0.1729, reg_loss: 0.1726 ||:  34%|###4      | 38/111 [00:27<00:56,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9332, LAS: 0.8807, UEM: 0.5845, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8210, partial_loss/deprel_loss: 0.7104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9054, loss: 0.8468, batch_reg_loss: 0.1729, reg_loss: 0.1726 ||:  37%|###6      | 41/111 [00:29<00:52,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9329, LAS: 0.8802, UEM: 0.5758, LEM: 0.3590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0728, partial_loss/deprel_loss: 0.9505, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1480, loss: 0.8477, batch_reg_loss: 0.1730, reg_loss: 0.1727 ||:  40%|###9      | 44/111 [00:31<00:49,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9333, LAS: 0.8805, UEM: 0.5705, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3542, partial_loss/deprel_loss: 0.4947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6395, loss: 0.8465, batch_reg_loss: 0.1730, reg_loss: 0.1727 ||:  42%|####2     | 47/111 [00:33<00:46,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9328, LAS: 0.8799, UEM: 0.5733, LEM: 0.3577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1635, partial_loss/deprel_loss: 0.3313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4708, loss: 0.8541, batch_reg_loss: 0.1730, reg_loss: 0.1727 ||:  46%|####5     | 51/111 [00:36<00:43,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9341, LAS: 0.8814, UEM: 0.5789, LEM: 0.3594, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3308, partial_loss/deprel_loss: 0.5056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6438, loss: 0.8426, batch_reg_loss: 0.1731, reg_loss: 0.1727 ||:  49%|####8     | 54/111 [00:38<00:41,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9337, LAS: 0.8810, UEM: 0.5784, LEM: 0.3584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2728, partial_loss/deprel_loss: 0.4433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5823, loss: 0.8452, batch_reg_loss: 0.1731, reg_loss: 0.1727 ||:  51%|#####1    | 57/111 [00:40<00:39,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9347, LAS: 0.8819, UEM: 0.5824, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5877, partial_loss/deprel_loss: 0.6521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8124, loss: 0.8381, batch_reg_loss: 0.1732, reg_loss: 0.1728 ||:  54%|#####4    | 60/111 [00:43<00:38,  1.33it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8242, UAS: 0.9333, LAS: 0.8805, UEM: 0.5715, LEM: 0.3503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4308, partial_loss/deprel_loss: 1.1157, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3520, loss: 0.8506, batch_reg_loss: 0.1732, reg_loss: 0.1728 ||:  57%|#####6    | 63/111 [00:45<00:35,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9334, LAS: 0.8804, UEM: 0.5614, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7164, partial_loss/deprel_loss: 0.7620, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9261, loss: 0.8528, batch_reg_loss: 0.1733, reg_loss: 0.1728 ||:  60%|######    | 67/111 [00:47<00:29,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8562, UAS: 0.9334, LAS: 0.8803, UEM: 0.5556, LEM: 0.3320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9412, partial_loss/deprel_loss: 0.8262, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0225, loss: 0.8533, batch_reg_loss: 0.1733, reg_loss: 0.1728 ||:  64%|######3   | 71/111 [00:49<00:25,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9320, LAS: 0.8785, UEM: 0.5549, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1992, partial_loss/deprel_loss: 0.3865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5224, loss: 0.8659, batch_reg_loss: 0.1734, reg_loss: 0.1729 ||:  68%|######7   | 75/111 [00:52<00:23,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8442, UAS: 0.9316, LAS: 0.8779, UEM: 0.5463, LEM: 0.3221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0091, partial_loss/deprel_loss: 0.9599, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1432, loss: 0.8711, batch_reg_loss: 0.1734, reg_loss: 0.1729 ||:  71%|#######1  | 79/111 [00:55<00:21,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9326, LAS: 0.8789, UEM: 0.5523, LEM: 0.3229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2824, partial_loss/deprel_loss: 0.4500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5900, loss: 0.8622, batch_reg_loss: 0.1735, reg_loss: 0.1729 ||:  75%|#######4  | 83/111 [00:58<00:19,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9327, LAS: 0.8790, UEM: 0.5486, LEM: 0.3190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2842, partial_loss/deprel_loss: 0.5412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6634, loss: 0.8606, batch_reg_loss: 0.1735, reg_loss: 0.1729 ||:  77%|#######7  | 86/111 [01:00<00:17,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9320, LAS: 0.8782, UEM: 0.5492, LEM: 0.3182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2800, partial_loss/deprel_loss: 0.4778, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.8675, batch_reg_loss: 0.1736, reg_loss: 0.1730 ||:  80%|########  | 89/111 [01:02<00:15,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9325, LAS: 0.8787, UEM: 0.5477, LEM: 0.3148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6621, partial_loss/deprel_loss: 0.7544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9096, loss: 0.8624, batch_reg_loss: 0.1736, reg_loss: 0.1730 ||:  84%|########3 | 93/111 [01:04<00:12,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8652, UAS: 0.9321, LAS: 0.8784, UEM: 0.5426, LEM: 0.3108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9823, partial_loss/deprel_loss: 0.8097, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0179, loss: 0.8656, batch_reg_loss: 0.1737, reg_loss: 0.1730 ||:  86%|########6 | 96/111 [01:06<00:10,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9319, LAS: 0.8782, UEM: 0.5405, LEM: 0.3084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4858, partial_loss/deprel_loss: 0.6298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7747, loss: 0.8675, batch_reg_loss: 0.1737, reg_loss: 0.1730 ||:  90%|######### | 100/111 [01:09<00:07,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9323, LAS: 0.8785, UEM: 0.5404, LEM: 0.3064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5189, partial_loss/deprel_loss: 0.6216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7748, loss: 0.8655, batch_reg_loss: 0.1738, reg_loss: 0.1731 ||:  94%|#########3| 104/111 [01:12<00:04,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8941, UAS: 0.9324, LAS: 0.8785, UEM: 0.5361, LEM: 0.3023, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4727, partial_loss/deprel_loss: 0.5968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7458, loss: 0.8654, batch_reg_loss: 0.1738, reg_loss: 0.1731 ||:  96%|#########6| 107/111 [01:14<00:02,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8647, UAS: 0.9322, LAS: 0.8783, UEM: 0.5396, LEM: 0.3066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7106, partial_loss/deprel_loss: 0.7900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9480, loss: 0.8659, batch_reg_loss: 0.1739, reg_loss: 0.1731 ||:  99%|#########9| 110/111 [01:16<00:00,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8374, UAS: 0.9319, LAS: 0.8779, UEM: 0.5374, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1673, partial_loss/deprel_loss: 0.9337, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1543, loss: 0.8685, batch_reg_loss: 0.1739, reg_loss: 0.1731 ||: 100%|##########| 111/111 [01:17<00:00,  1.44it/s]\n",
      "2023-04-07 00:08:17,587 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:08:17,587 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:08:17,587 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.934  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.167  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - UEM                      |     0.537  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - LAS                      |     0.878  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - loss                     |     0.869  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - LEM                      |     0.305  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:08:17,588 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - UAS                      |     0.932  |       N/A\n",
      "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - EM                       |     0.837  |       N/A\n",
      "2023-04-07 00:08:17,589 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:08:17,589 - INFO - combo.training.trainer - Epoch duration: 0:01:17.327204\n",
      "2023-04-07 00:08:17,589 - INFO - combo.training.trainer - Estimated training time remaining: 7:24:51\n",
      "2023-04-07 00:08:17,590 - INFO - allennlp.training.trainer - Epoch 60/399\n",
      "2023-04-07 00:08:17,590 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:08:17,590 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:08:17,598 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9362, LAS: 0.8814, UEM: 0.3503, LEM: 0.1203, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8053, partial_loss/deprel_loss: 0.7054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8993, loss: 0.8470, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:   3%|2         | 3/111 [00:02<01:20,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8333, UAS: 0.9321, LAS: 0.8779, UEM: 0.3913, LEM: 0.1676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2081, partial_loss/deprel_loss: 0.9663, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1886, loss: 0.8611, batch_reg_loss: 0.1740, reg_loss: 0.1739 ||:   6%|6         | 7/111 [00:04<01:13,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7929, UAS: 0.9231, LAS: 0.8686, UEM: 0.3932, LEM: 0.1813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.0036, partial_loss/deprel_loss: 1.1850, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5227, loss: 0.9405, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:   9%|9         | 10/111 [00:07<01:13,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9264, LAS: 0.8725, UEM: 0.4786, LEM: 0.2742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1777, partial_loss/deprel_loss: 0.3238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.9067, batch_reg_loss: 0.1741, reg_loss: 0.1740 ||:  12%|#1        | 13/111 [00:09<01:14,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9316, LAS: 0.8780, UEM: 0.5387, LEM: 0.3116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6095, partial_loss/deprel_loss: 0.6517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8174, loss: 0.8575, batch_reg_loss: 0.1741, reg_loss: 0.1740 ||:  14%|#4        | 16/111 [00:11<01:10,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9362, LAS: 0.8836, UEM: 0.6020, LEM: 0.3786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0994, partial_loss/deprel_loss: 0.2475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3920, loss: 0.8120, batch_reg_loss: 0.1742, reg_loss: 0.1740 ||:  18%|#8        | 20/111 [00:14<01:04,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9373, LAS: 0.8850, UEM: 0.5973, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5161, partial_loss/deprel_loss: 0.6815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8226, loss: 0.8053, batch_reg_loss: 0.1742, reg_loss: 0.1741 ||:  22%|##1       | 24/111 [00:16<00:59,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9403, LAS: 0.8883, UEM: 0.6151, LEM: 0.3769, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4976, partial_loss/deprel_loss: 0.6561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7986, loss: 0.7819, batch_reg_loss: 0.1742, reg_loss: 0.1741 ||:  25%|##5       | 28/111 [00:19<00:54,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8948, UAS: 0.9413, LAS: 0.8891, UEM: 0.6076, LEM: 0.3650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4554, partial_loss/deprel_loss: 0.5114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6744, loss: 0.7749, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||:  28%|##7       | 31/111 [00:21<00:54,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9397, LAS: 0.8876, UEM: 0.6007, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2657, partial_loss/deprel_loss: 0.4361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5763, loss: 0.7878, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||:  31%|###       | 34/111 [00:23<00:53,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8368, UAS: 0.9376, LAS: 0.8857, UEM: 0.5841, LEM: 0.3488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2452, partial_loss/deprel_loss: 0.9293, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1668, loss: 0.8026, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||:  33%|###3      | 37/111 [00:25<00:52,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8688, UAS: 0.9343, LAS: 0.8819, UEM: 0.5689, LEM: 0.3378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8595, partial_loss/deprel_loss: 0.8019, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9878, loss: 0.8301, batch_reg_loss: 0.1743, reg_loss: 0.1741 ||:  36%|###6      | 40/111 [00:27<00:50,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8483, UAS: 0.9321, LAS: 0.8796, UEM: 0.5564, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1939, partial_loss/deprel_loss: 0.9149, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1451, loss: 0.8517, batch_reg_loss: 0.1744, reg_loss: 0.1742 ||:  40%|###9      | 44/111 [00:30<00:47,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9065, UAS: 0.9335, LAS: 0.8809, UEM: 0.5663, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3052, partial_loss/deprel_loss: 0.4650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6075, loss: 0.8412, batch_reg_loss: 0.1744, reg_loss: 0.1742 ||:  42%|####2     | 47/111 [00:32<00:46,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8790, UAS: 0.9348, LAS: 0.8828, UEM: 0.5920, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6005, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7820, loss: 0.8263, batch_reg_loss: 0.1745, reg_loss: 0.1742 ||:  45%|####5     | 50/111 [00:35<00:47,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8130, UAS: 0.9329, LAS: 0.8806, UEM: 0.5860, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5709, partial_loss/deprel_loss: 1.0503, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3290, loss: 0.8424, batch_reg_loss: 0.1745, reg_loss: 0.1742 ||:  48%|####7     | 53/111 [00:38<00:45,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8496, UAS: 0.9336, LAS: 0.8812, UEM: 0.5811, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9414, partial_loss/deprel_loss: 0.9016, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0842, loss: 0.8390, batch_reg_loss: 0.1746, reg_loss: 0.1742 ||:  51%|#####1    | 57/111 [00:40<00:39,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8404, UAS: 0.9304, LAS: 0.8778, UEM: 0.5673, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2525, partial_loss/deprel_loss: 0.9174, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1591, loss: 0.8677, batch_reg_loss: 0.1746, reg_loss: 0.1743 ||:  55%|#####4    | 61/111 [00:43<00:35,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8513, UAS: 0.9310, LAS: 0.8782, UEM: 0.5702, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9025, partial_loss/deprel_loss: 0.9015, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0764, loss: 0.8632, batch_reg_loss: 0.1747, reg_loss: 0.1743 ||:  58%|#####7    | 64/111 [00:45<00:33,  1.39it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9320, LAS: 0.8794, UEM: 0.5685, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3395, partial_loss/deprel_loss: 0.4841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6300, loss: 0.8545, batch_reg_loss: 0.1748, reg_loss: 0.1743 ||:  61%|######1   | 68/111 [00:47<00:29,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9312, LAS: 0.8783, UEM: 0.5588, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7327, partial_loss/deprel_loss: 0.7282, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9039, loss: 0.8620, batch_reg_loss: 0.1748, reg_loss: 0.1743 ||:  64%|######3   | 71/111 [00:50<00:28,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9307, LAS: 0.8778, UEM: 0.5490, LEM: 0.3263, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0077, partial_loss/deprel_loss: 0.8423, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0502, loss: 0.8669, batch_reg_loss: 0.1749, reg_loss: 0.1744 ||:  68%|######7   | 75/111 [00:52<00:24,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9306, LAS: 0.8776, UEM: 0.5447, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3445, partial_loss/deprel_loss: 0.5258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6645, loss: 0.8677, batch_reg_loss: 0.1749, reg_loss: 0.1744 ||:  70%|#######   | 78/111 [00:54<00:22,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9295, LAS: 0.8763, UEM: 0.5389, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3530, partial_loss/deprel_loss: 0.5616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6949, loss: 0.8791, batch_reg_loss: 0.1750, reg_loss: 0.1744 ||:  74%|#######3  | 82/111 [00:57<00:19,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9295, LAS: 0.8762, UEM: 0.5307, LEM: 0.3081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8574, partial_loss/deprel_loss: 0.7822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9723, loss: 0.8802, batch_reg_loss: 0.1750, reg_loss: 0.1744 ||:  77%|#######7  | 86/111 [00:59<00:16,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9299, LAS: 0.8766, UEM: 0.5393, LEM: 0.3177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1638, partial_loss/deprel_loss: 0.3223, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4657, loss: 0.8764, batch_reg_loss: 0.1751, reg_loss: 0.1745 ||:  81%|########1 | 90/111 [01:02<00:14,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9300, LAS: 0.8768, UEM: 0.5359, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4274, partial_loss/deprel_loss: 0.5398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6925, loss: 0.8751, batch_reg_loss: 0.1751, reg_loss: 0.1745 ||:  84%|########3 | 93/111 [01:05<00:12,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9306, LAS: 0.8774, UEM: 0.5408, LEM: 0.3163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2533, partial_loss/deprel_loss: 0.4176, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.8691, batch_reg_loss: 0.1752, reg_loss: 0.1745 ||:  87%|########7 | 97/111 [01:07<00:09,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9311, LAS: 0.8780, UEM: 0.5431, LEM: 0.3172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5743, partial_loss/deprel_loss: 0.6671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8238, loss: 0.8644, batch_reg_loss: 0.1752, reg_loss: 0.1745 ||:  90%|######### | 100/111 [01:10<00:08,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8498, UAS: 0.9306, LAS: 0.8773, UEM: 0.5365, LEM: 0.3118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0491, partial_loss/deprel_loss: 0.9409, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1378, loss: 0.8708, batch_reg_loss: 0.1753, reg_loss: 0.1746 ||:  94%|#########3| 104/111 [01:12<00:04,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9302, LAS: 0.8767, UEM: 0.5311, LEM: 0.3074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4103, partial_loss/deprel_loss: 0.5165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6706, loss: 0.8771, batch_reg_loss: 0.1753, reg_loss: 0.1746 ||:  97%|#########7| 108/111 [01:14<00:01,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8729, UAS: 0.9305, LAS: 0.8769, UEM: 0.5294, LEM: 0.3047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6519, partial_loss/deprel_loss: 0.7411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8986, loss: 0.8754, batch_reg_loss: 0.1754, reg_loss: 0.1746 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-07 00:09:34,322 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9379, LAS: 0.8794, UEM: 0.4599, LEM: 0.1283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5266, partial_loss/deprel_loss: 24.2651, partial_loss/cycle_loss: 0.0000, batch_loss: 19.5174, loss: 24.7563, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.13it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9527, LAS: 0.8970, UEM: 0.6623, LEM: 0.3284, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4145, partial_loss/deprel_loss: 26.3179, partial_loss/cycle_loss: 0.0000, batch_loss: 21.1372, loss: 22.3640, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.11it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9426, LAS: 0.8873, UEM: 0.6137, LEM: 0.2966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6098, partial_loss/deprel_loss: 34.3925, partial_loss/cycle_loss: 0.0000, batch_loss: 27.6359, loss: 26.0534, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.07it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8674, UAS: 0.9435, LAS: 0.8887, UEM: 0.5935, LEM: 0.2872, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0499, partial_loss/deprel_loss: 43.7402, partial_loss/cycle_loss: 0.0000, batch_loss: 35.2022, loss: 25.6088, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.07it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9441, LAS: 0.8910, UEM: 0.6411, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3157, partial_loss/deprel_loss: 48.7881, partial_loss/cycle_loss: 0.0000, batch_loss: 39.2936, loss: 25.9567, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.01it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8610, UAS: 0.9441, LAS: 0.8910, UEM: 0.6411, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3157, partial_loss/deprel_loss: 48.7881, partial_loss/cycle_loss: 0.0000, batch_loss: 39.2936, loss: 25.9567, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.04it/s]\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.741  |    48.788\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.652  |     1.316\n",
      "2023-04-07 00:09:46,834 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.175  |     0.000\n",
      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - UEM                      |     0.529  |     0.641\n",
      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - LAS                      |     0.877  |     0.891\n",
      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - loss                     |     0.875  |    25.957\n",
      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - LEM                      |     0.305  |     0.372\n",
      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - UAS                      |     0.930  |     0.944\n",
      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - EM                       |     0.873  |     0.861\n",
      "2023-04-07 00:09:46,835 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:09:49,183 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:09:50,393 - INFO - combo.training.trainer - Epoch duration: 0:01:32.803051\n",
      "2023-04-07 00:09:50,393 - INFO - combo.training.trainer - Estimated training time remaining: 7:24:52\n",
      "2023-04-07 00:09:50,393 - INFO - allennlp.training.trainer - Epoch 61/399\n",
      "2023-04-07 00:09:50,393 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:09:50,393 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:09:50,399 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8676, UAS: 0.9301, LAS: 0.8725, UEM: 0.4525, LEM: 0.2185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7400, partial_loss/deprel_loss: 0.8407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9960, loss: 0.8934, batch_reg_loss: 0.1754, reg_loss: 0.1754 ||:   3%|2         | 3/111 [00:02<01:12,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9359, LAS: 0.8807, UEM: 0.5602, LEM: 0.3259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5457, partial_loss/deprel_loss: 0.6338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7916, loss: 0.8117, batch_reg_loss: 0.1755, reg_loss: 0.1754 ||:   5%|5         | 6/111 [00:04<01:12,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9390, LAS: 0.8858, UEM: 0.5364, LEM: 0.3008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4178, partial_loss/deprel_loss: 0.5122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6688, loss: 0.7848, batch_reg_loss: 0.1755, reg_loss: 0.1754 ||:   8%|8         | 9/111 [00:06<01:10,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7975, UAS: 0.9267, LAS: 0.8726, UEM: 0.4816, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7705, partial_loss/deprel_loss: 1.2301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5137, loss: 0.9004, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  11%|#         | 12/111 [00:08<01:11,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9329, LAS: 0.8789, UEM: 0.5466, LEM: 0.3070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4847, partial_loss/deprel_loss: 0.5487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7115, loss: 0.8472, batch_reg_loss: 0.1756, reg_loss: 0.1755 ||:  14%|#3        | 15/111 [00:10<01:07,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9263, LAS: 0.8721, UEM: 0.4951, LEM: 0.2746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4953, partial_loss/deprel_loss: 0.9569, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2402, loss: 0.9045, batch_reg_loss: 0.1757, reg_loss: 0.1755 ||:  17%|#7        | 19/111 [00:13<01:02,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9278, LAS: 0.8743, UEM: 0.5035, LEM: 0.2797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2306, partial_loss/deprel_loss: 0.3509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5025, loss: 0.8852, batch_reg_loss: 0.1757, reg_loss: 0.1755 ||:  20%|#9        | 22/111 [00:15<01:00,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9288, LAS: 0.8748, UEM: 0.4971, LEM: 0.2717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2908, partial_loss/deprel_loss: 0.5508, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6746, loss: 0.8829, batch_reg_loss: 0.1758, reg_loss: 0.1756 ||:  23%|##2       | 25/111 [00:17<01:00,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9293, LAS: 0.8759, UEM: 0.5267, LEM: 0.2979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2407, partial_loss/deprel_loss: 0.4070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5496, loss: 0.8696, batch_reg_loss: 0.1758, reg_loss: 0.1756 ||:  25%|##5       | 28/111 [00:19<00:59,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8130, UAS: 0.9297, LAS: 0.8768, UEM: 0.5495, LEM: 0.3195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5913, partial_loss/deprel_loss: 1.1328, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4003, loss: 0.8653, batch_reg_loss: 0.1758, reg_loss: 0.1756 ||:  28%|##7       | 31/111 [00:21<00:58,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8659, UAS: 0.9309, LAS: 0.8782, UEM: 0.5469, LEM: 0.3167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7353, partial_loss/deprel_loss: 0.8071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9686, loss: 0.8547, batch_reg_loss: 0.1759, reg_loss: 0.1756 ||:  31%|###       | 34/111 [00:24<00:56,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8492, UAS: 0.9306, LAS: 0.8777, UEM: 0.5350, LEM: 0.3066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9533, partial_loss/deprel_loss: 0.8344, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0341, loss: 0.8590, batch_reg_loss: 0.1759, reg_loss: 0.1757 ||:  33%|###3      | 37/111 [00:26<00:54,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9295, LAS: 0.8769, UEM: 0.5536, LEM: 0.3278, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4604, partial_loss/deprel_loss: 0.5286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6909, loss: 0.8681, batch_reg_loss: 0.1760, reg_loss: 0.1757 ||:  36%|###6      | 40/111 [00:28<00:53,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9295, LAS: 0.8769, UEM: 0.5425, LEM: 0.3175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4519, partial_loss/deprel_loss: 0.5442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7018, loss: 0.8705, batch_reg_loss: 0.1760, reg_loss: 0.1757 ||:  39%|###8      | 43/111 [00:30<00:49,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8691, UAS: 0.9290, LAS: 0.8759, UEM: 0.5314, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6497, partial_loss/deprel_loss: 0.7674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9200, loss: 0.8797, batch_reg_loss: 0.1761, reg_loss: 0.1757 ||:  42%|####2     | 47/111 [00:33<00:44,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8567, UAS: 0.9299, LAS: 0.8766, UEM: 0.5275, LEM: 0.3006, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0313, partial_loss/deprel_loss: 0.9238, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1214, loss: 0.8750, batch_reg_loss: 0.1761, reg_loss: 0.1758 ||:  46%|####5     | 51/111 [00:35<00:40,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9301, LAS: 0.8769, UEM: 0.5190, LEM: 0.2921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5316, partial_loss/deprel_loss: 0.5359, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7112, loss: 0.8718, batch_reg_loss: 0.1762, reg_loss: 0.1758 ||:  49%|####8     | 54/111 [00:38<00:39,  1.43it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9306, LAS: 0.8773, UEM: 0.5160, LEM: 0.2865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5170, partial_loss/deprel_loss: 0.6902, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8318, loss: 0.8682, batch_reg_loss: 0.1762, reg_loss: 0.1758 ||:  52%|#####2    | 58/111 [00:40<00:35,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8467, UAS: 0.9301, LAS: 0.8768, UEM: 0.5379, LEM: 0.3110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9494, partial_loss/deprel_loss: 0.8664, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0593, loss: 0.8701, batch_reg_loss: 0.1763, reg_loss: 0.1758 ||:  56%|#####5    | 62/111 [00:43<00:35,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9310, LAS: 0.8777, UEM: 0.5382, LEM: 0.3078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3715, partial_loss/deprel_loss: 0.5127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6608, loss: 0.8643, batch_reg_loss: 0.1763, reg_loss: 0.1759 ||:  59%|#####8    | 65/111 [00:45<00:32,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9318, LAS: 0.8785, UEM: 0.5475, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3592, partial_loss/deprel_loss: 0.5754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7085, loss: 0.8581, batch_reg_loss: 0.1764, reg_loss: 0.1759 ||:  61%|######1   | 68/111 [00:48<00:32,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9326, LAS: 0.8792, UEM: 0.5501, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4939, partial_loss/deprel_loss: 0.6939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8303, loss: 0.8533, batch_reg_loss: 0.1764, reg_loss: 0.1759 ||:  64%|######3   | 71/111 [00:50<00:29,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8675, UAS: 0.9329, LAS: 0.8796, UEM: 0.5458, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8771, partial_loss/deprel_loss: 0.8076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9980, loss: 0.8528, batch_reg_loss: 0.1764, reg_loss: 0.1759 ||:  68%|######7   | 75/111 [00:52<00:24,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8787, UAS: 0.9329, LAS: 0.8795, UEM: 0.5392, LEM: 0.3021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7339, partial_loss/deprel_loss: 0.8141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9745, loss: 0.8561, batch_reg_loss: 0.1765, reg_loss: 0.1760 ||:  70%|#######   | 78/111 [00:54<00:22,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8550, UAS: 0.9331, LAS: 0.8798, UEM: 0.5351, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9806, partial_loss/deprel_loss: 0.8367, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0420, loss: 0.8542, batch_reg_loss: 0.1765, reg_loss: 0.1760 ||:  74%|#######3  | 82/111 [00:57<00:19,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8505, UAS: 0.9331, LAS: 0.8796, UEM: 0.5288, LEM: 0.2907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9883, partial_loss/deprel_loss: 0.8582, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0608, loss: 0.8549, batch_reg_loss: 0.1766, reg_loss: 0.1760 ||:  77%|#######7  | 86/111 [00:59<00:16,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8371, UAS: 0.9325, LAS: 0.8789, UEM: 0.5258, LEM: 0.2895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1699, partial_loss/deprel_loss: 0.9620, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1802, loss: 0.8598, batch_reg_loss: 0.1766, reg_loss: 0.1760 ||:  81%|########1 | 90/111 [01:02<00:14,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9327, LAS: 0.8790, UEM: 0.5229, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5761, partial_loss/deprel_loss: 0.7385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8827, loss: 0.8601, batch_reg_loss: 0.1767, reg_loss: 0.1761 ||:  85%|########4 | 94/111 [01:05<00:11,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9327, LAS: 0.8789, UEM: 0.5254, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2904, partial_loss/deprel_loss: 0.4370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5844, loss: 0.8596, batch_reg_loss: 0.1767, reg_loss: 0.1761 ||:  88%|########8 | 98/111 [01:08<00:09,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8589, UAS: 0.9322, LAS: 0.8783, UEM: 0.5222, LEM: 0.2851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8614, partial_loss/deprel_loss: 0.8358, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0177, loss: 0.8647, batch_reg_loss: 0.1768, reg_loss: 0.1761 ||:  92%|#########1| 102/111 [01:11<00:06,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8329, UAS: 0.9325, LAS: 0.8787, UEM: 0.5388, LEM: 0.3065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3338, partial_loss/deprel_loss: 0.9728, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2218, loss: 0.8622, batch_reg_loss: 0.1768, reg_loss: 0.1761 ||:  95%|#########4| 105/111 [01:13<00:04,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8788, UAS: 0.9322, LAS: 0.8784, UEM: 0.5361, LEM: 0.3039, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6211, partial_loss/deprel_loss: 0.6854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8494, loss: 0.8656, batch_reg_loss: 0.1769, reg_loss: 0.1762 ||:  98%|#########8| 109/111 [01:16<00:01,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8162, UAS: 0.9319, LAS: 0.8781, UEM: 0.5376, LEM: 0.3051, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5148, partial_loss/deprel_loss: 1.0411, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3128, loss: 0.8674, batch_reg_loss: 0.1769, reg_loss: 0.1762 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
      "2023-04-07 00:11:10,307 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:11:10,307 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.041  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.515  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.176  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - UEM                      |     0.538  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - LAS                      |     0.878  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - loss                     |     0.867  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - LEM                      |     0.305  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:11:10,308 - INFO - combo.training.tensorboard_writer - UAS                      |     0.932  |       N/A\n",
      "2023-04-07 00:11:10,309 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:11:10,309 - INFO - combo.training.tensorboard_writer - EM                       |     0.816  |       N/A\n",
      "2023-04-07 00:11:10,309 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:11:10,313 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:11:15,962 - INFO - combo.training.trainer - Epoch duration: 0:01:25.568982\n",
      "2023-04-07 00:11:15,962 - INFO - combo.training.trainer - Estimated training time remaining: 7:24:11\n",
      "2023-04-07 00:11:15,962 - INFO - allennlp.training.trainer - Epoch 62/399\n",
      "2023-04-07 00:11:15,963 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:11:15,963 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:11:15,970 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8698, UAS: 0.9461, LAS: 0.8929, UEM: 0.6482, LEM: 0.3817, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8178, partial_loss/deprel_loss: 0.7325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9265, loss: 0.7051, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:   3%|2         | 3/111 [00:02<01:19,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8685, UAS: 0.9367, LAS: 0.8823, UEM: 0.5942, LEM: 0.3705, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6823, partial_loss/deprel_loss: 0.8525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9954, loss: 0.8175, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:   6%|6         | 7/111 [00:04<01:12,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7817, UAS: 0.9301, LAS: 0.8763, UEM: 0.5643, LEM: 0.3362, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2934, partial_loss/deprel_loss: 1.3399, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7076, loss: 0.8878, batch_reg_loss: 0.1770, reg_loss: 0.1769 ||:   9%|9         | 10/111 [00:06<01:10,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9312, LAS: 0.8783, UEM: 0.5568, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2351, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.8788, batch_reg_loss: 0.1770, reg_loss: 0.1769 ||:  13%|#2        | 14/111 [00:09<01:05,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9361, LAS: 0.8829, UEM: 0.5695, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4688, partial_loss/deprel_loss: 0.5094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6782, loss: 0.8412, batch_reg_loss: 0.1770, reg_loss: 0.1769 ||:  15%|#5        | 17/111 [00:11<01:06,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8554, UAS: 0.9335, LAS: 0.8806, UEM: 0.5433, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0345, partial_loss/deprel_loss: 0.7780, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0062, loss: 0.8508, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||:  18%|#8        | 20/111 [00:13<01:03,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8884, UAS: 0.9343, LAS: 0.8818, UEM: 0.5205, LEM: 0.2839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6520, partial_loss/deprel_loss: 0.6173, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8012, loss: 0.8428, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||:  22%|##1       | 24/111 [00:16<00:58,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8690, UAS: 0.9322, LAS: 0.8798, UEM: 0.4931, LEM: 0.2629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7861, partial_loss/deprel_loss: 0.7325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9202, loss: 0.8579, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||:  25%|##5       | 28/111 [00:18<00:55,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9330, LAS: 0.8811, UEM: 0.5272, LEM: 0.3073, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1210, partial_loss/deprel_loss: 0.2362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3901, loss: 0.8492, batch_reg_loss: 0.1770, reg_loss: 0.1770 ||:  28%|##7       | 31/111 [00:21<00:56,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9329, LAS: 0.8809, UEM: 0.5126, LEM: 0.2930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5720, partial_loss/deprel_loss: 0.6731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8298, loss: 0.8500, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||:  31%|###       | 34/111 [00:23<00:54,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9333, LAS: 0.8813, UEM: 0.5162, LEM: 0.2939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5572, partial_loss/deprel_loss: 0.5714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7455, loss: 0.8451, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||:  33%|###3      | 37/111 [00:25<00:53,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9343, LAS: 0.8824, UEM: 0.5142, LEM: 0.2895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4571, partial_loss/deprel_loss: 0.6004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7487, loss: 0.8359, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||:  36%|###6      | 40/111 [00:27<00:52,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9351, LAS: 0.8832, UEM: 0.5291, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3019, partial_loss/deprel_loss: 0.4755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6177, loss: 0.8277, batch_reg_loss: 0.1769, reg_loss: 0.1770 ||:  39%|###8      | 43/111 [00:30<00:50,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9371, LAS: 0.8861, UEM: 0.5756, LEM: 0.3583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2111, partial_loss/deprel_loss: 0.3450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4951, loss: 0.8072, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  41%|####1     | 46/111 [00:32<00:49,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8542, UAS: 0.9372, LAS: 0.8862, UEM: 0.5747, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0707, partial_loss/deprel_loss: 0.8576, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0771, loss: 0.8040, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  44%|####4     | 49/111 [00:34<00:47,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9382, LAS: 0.8872, UEM: 0.5813, LEM: 0.3621, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4093, partial_loss/deprel_loss: 0.4927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6529, loss: 0.7991, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  47%|####6     | 52/111 [00:36<00:43,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8502, UAS: 0.9379, LAS: 0.8868, UEM: 0.5728, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9311, partial_loss/deprel_loss: 0.9079, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0894, loss: 0.8040, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  50%|#####     | 56/111 [00:39<00:37,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9370, LAS: 0.8861, UEM: 0.5686, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2738, partial_loss/deprel_loss: 0.4237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5706, loss: 0.8109, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  53%|#####3    | 59/111 [00:41<00:36,  1.44it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9375, LAS: 0.8867, UEM: 0.5667, LEM: 0.3447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4263, partial_loss/deprel_loss: 0.6020, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7437, loss: 0.8056, batch_reg_loss: 0.1769, reg_loss: 0.1769 ||:  56%|#####5    | 62/111 [00:43<00:34,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9370, LAS: 0.8863, UEM: 0.5694, LEM: 0.3457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3908, partial_loss/deprel_loss: 0.5036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6579, loss: 0.8078, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  59%|#####8    | 65/111 [00:45<00:33,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9366, LAS: 0.8859, UEM: 0.5667, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2895, partial_loss/deprel_loss: 0.3820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5403, loss: 0.8122, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  61%|######1   | 68/111 [00:47<00:30,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8628, UAS: 0.9359, LAS: 0.8850, UEM: 0.5564, LEM: 0.3342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8085, partial_loss/deprel_loss: 0.8201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9946, loss: 0.8185, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  65%|######4   | 72/111 [00:50<00:26,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8626, UAS: 0.9351, LAS: 0.8842, UEM: 0.5619, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0201, partial_loss/deprel_loss: 0.7898, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0127, loss: 0.8247, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  68%|######7   | 75/111 [00:52<00:25,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9361, LAS: 0.8853, UEM: 0.5672, LEM: 0.3431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3834, partial_loss/deprel_loss: 0.5284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6762, loss: 0.8170, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  70%|#######   | 78/111 [00:54<00:23,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9357, LAS: 0.8848, UEM: 0.5614, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2974, partial_loss/deprel_loss: 0.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5576, loss: 0.8223, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  74%|#######3  | 82/111 [00:57<00:20,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9364, LAS: 0.8856, UEM: 0.5646, LEM: 0.3391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3102, partial_loss/deprel_loss: 0.5018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.8165, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  77%|#######6  | 85/111 [00:59<00:17,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8792, UAS: 0.9356, LAS: 0.8847, UEM: 0.5610, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6688, partial_loss/deprel_loss: 0.6762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8515, loss: 0.8214, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  80%|########  | 89/111 [01:01<00:14,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8611, UAS: 0.9349, LAS: 0.8840, UEM: 0.5549, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9371, partial_loss/deprel_loss: 0.8498, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0440, loss: 0.8271, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  84%|########3 | 93/111 [01:04<00:11,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9349, LAS: 0.8841, UEM: 0.5478, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6846, partial_loss/deprel_loss: 0.6411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8266, loss: 0.8268, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  87%|########7 | 97/111 [01:06<00:08,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9355, LAS: 0.8848, UEM: 0.5496, LEM: 0.3244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3925, partial_loss/deprel_loss: 0.5808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7199, loss: 0.8227, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  91%|######### | 101/111 [01:09<00:06,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9350, LAS: 0.8839, UEM: 0.5418, LEM: 0.3178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5451, partial_loss/deprel_loss: 0.6392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7972, loss: 0.8280, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  95%|#########4| 105/111 [01:12<00:03,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9350, LAS: 0.8839, UEM: 0.5435, LEM: 0.3193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7372, partial_loss/deprel_loss: 0.6851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8723, loss: 0.8279, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||:  98%|#########8| 109/111 [01:15<00:01,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9352, LAS: 0.8843, UEM: 0.5459, LEM: 0.3214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2081, partial_loss/deprel_loss: 0.3644, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5099, loss: 0.8251, batch_reg_loss: 0.1768, reg_loss: 0.1769 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 00:12:35,728 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.364  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.208  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.177  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - UEM                      |     0.546  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - LAS                      |     0.884  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - loss                     |     0.825  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - LEM                      |     0.321  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - UAS                      |     0.935  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - EM                       |     0.926  |       N/A\n",
      "2023-04-07 00:12:35,729 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:12:35,734 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:12:40,483 - INFO - combo.training.trainer - Epoch duration: 0:01:24.520495\n",
      "2023-04-07 00:12:40,484 - INFO - combo.training.trainer - Estimated training time remaining: 7:23:22\n",
      "2023-04-07 00:12:40,484 - INFO - allennlp.training.trainer - Epoch 63/399\n",
      "2023-04-07 00:12:40,484 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:12:40,485 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:12:40,495 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9622, LAS: 0.9136, UEM: 0.7143, LEM: 0.3932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2952, partial_loss/deprel_loss: 0.4429, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5901, loss: 0.5662, batch_reg_loss: 0.1767, reg_loss: 0.1768 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9647, LAS: 0.9167, UEM: 0.7773, LEM: 0.5015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1387, partial_loss/deprel_loss: 0.3915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5177, loss: 0.5657, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:   5%|5         | 6/111 [00:04<01:17,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9528, LAS: 0.9026, UEM: 0.7066, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2673, partial_loss/deprel_loss: 0.3965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5474, loss: 0.6629, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:   9%|9         | 10/111 [00:07<01:11,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8438, UAS: 0.9508, LAS: 0.8998, UEM: 0.6968, LEM: 0.4310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0591, partial_loss/deprel_loss: 0.9699, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1644, loss: 0.6890, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:  12%|#1        | 13/111 [00:09<01:10,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9486, LAS: 0.8977, UEM: 0.6604, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3376, partial_loss/deprel_loss: 0.4769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6258, loss: 0.7111, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:  15%|#5        | 17/111 [00:11<01:04,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9484, LAS: 0.8977, UEM: 0.6432, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2738, partial_loss/deprel_loss: 0.4217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5688, loss: 0.7174, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:  19%|#8        | 21/111 [00:14<01:01,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9471, LAS: 0.8968, UEM: 0.6249, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3350, partial_loss/deprel_loss: 0.4300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5877, loss: 0.7248, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:  22%|##1       | 24/111 [00:16<01:00,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9458, LAS: 0.8951, UEM: 0.6095, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3742, partial_loss/deprel_loss: 0.5653, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7037, loss: 0.7378, batch_reg_loss: 0.1767, reg_loss: 0.1767 ||:  24%|##4       | 27/111 [00:18<00:58,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9469, LAS: 0.8963, UEM: 0.6098, LEM: 0.3461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2797, partial_loss/deprel_loss: 0.5113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6416, loss: 0.7258, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  28%|##7       | 31/111 [00:21<00:54,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9419, LAS: 0.8912, UEM: 0.5994, LEM: 0.3402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3695, partial_loss/deprel_loss: 0.4635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6213, loss: 0.7673, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  31%|###       | 34/111 [00:23<00:54,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8787, UAS: 0.9405, LAS: 0.8897, UEM: 0.5848, LEM: 0.3277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7267, partial_loss/deprel_loss: 0.6768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8634, loss: 0.7788, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  33%|###3      | 37/111 [00:25<00:52,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9384, LAS: 0.8874, UEM: 0.5624, LEM: 0.3122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9695, partial_loss/deprel_loss: 0.7204, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9468, loss: 0.7958, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  37%|###6      | 41/111 [00:28<00:49,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9389, LAS: 0.8880, UEM: 0.5617, LEM: 0.3114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3551, partial_loss/deprel_loss: 0.4208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5843, loss: 0.7929, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  40%|###9      | 44/111 [00:30<00:48,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8821, UAS: 0.9394, LAS: 0.8883, UEM: 0.5660, LEM: 0.3136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5540, partial_loss/deprel_loss: 0.6572, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8132, loss: 0.7888, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  42%|####2     | 47/111 [00:33<00:47,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9408, LAS: 0.8902, UEM: 0.5851, LEM: 0.3367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4763, partial_loss/deprel_loss: 0.5986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7508, loss: 0.7764, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  45%|####5     | 50/111 [00:35<00:47,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9396, LAS: 0.8890, UEM: 0.5734, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9640, partial_loss/deprel_loss: 0.7751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9895, loss: 0.7859, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  48%|####7     | 53/111 [00:38<00:44,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9395, LAS: 0.8891, UEM: 0.5686, LEM: 0.3225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4899, partial_loss/deprel_loss: 0.5436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7095, loss: 0.7854, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  50%|#####     | 56/111 [00:40<00:41,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9399, LAS: 0.8895, UEM: 0.5699, LEM: 0.3219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2513, partial_loss/deprel_loss: 0.4202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5631, loss: 0.7826, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  53%|#####3    | 59/111 [00:42<00:39,  1.30it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8977, UAS: 0.9391, LAS: 0.8886, UEM: 0.5616, LEM: 0.3157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4519, partial_loss/deprel_loss: 0.5807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7315, loss: 0.7914, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  56%|#####5    | 62/111 [00:44<00:36,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9392, LAS: 0.8885, UEM: 0.5575, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2907, partial_loss/deprel_loss: 0.5125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6448, loss: 0.7910, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  59%|#####9    | 66/111 [00:47<00:32,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8826, UAS: 0.9386, LAS: 0.8878, UEM: 0.5526, LEM: 0.3064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6683, partial_loss/deprel_loss: 0.7764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9313, loss: 0.7982, batch_reg_loss: 0.1766, reg_loss: 0.1767 ||:  62%|######2   | 69/111 [00:49<00:29,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9385, LAS: 0.8875, UEM: 0.5494, LEM: 0.3030, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.5013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6389, loss: 0.8003, batch_reg_loss: 0.1766, reg_loss: 0.1766 ||:  65%|######4   | 72/111 [00:51<00:28,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9390, LAS: 0.8885, UEM: 0.5791, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1575, partial_loss/deprel_loss: 0.2822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4339, loss: 0.7948, batch_reg_loss: 0.1766, reg_loss: 0.1766 ||:  68%|######7   | 75/111 [00:54<00:27,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8232, UAS: 0.9369, LAS: 0.8863, UEM: 0.5684, LEM: 0.3360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7013, partial_loss/deprel_loss: 0.9147, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2486, loss: 0.8097, batch_reg_loss: 0.1766, reg_loss: 0.1766 ||:  71%|#######1  | 79/111 [00:56<00:23,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9371, LAS: 0.8866, UEM: 0.5699, LEM: 0.3353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2117, partial_loss/deprel_loss: 0.3626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5090, loss: 0.8084, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  75%|#######4  | 83/111 [00:59<00:19,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9383, LAS: 0.8878, UEM: 0.5797, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1914, partial_loss/deprel_loss: 0.3426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4889, loss: 0.7984, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  78%|#######8  | 87/111 [01:02<00:16,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9379, LAS: 0.8874, UEM: 0.5752, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3438, partial_loss/deprel_loss: 0.4141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5766, loss: 0.8011, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  82%|########1 | 91/111 [01:04<00:13,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9383, LAS: 0.8878, UEM: 0.5733, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3745, partial_loss/deprel_loss: 0.4885, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6422, loss: 0.7969, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  85%|########4 | 94/111 [01:06<00:11,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9383, LAS: 0.8879, UEM: 0.5673, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7117, partial_loss/deprel_loss: 0.7441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9141, loss: 0.7961, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  88%|########8 | 98/111 [01:09<00:08,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9386, LAS: 0.8882, UEM: 0.5673, LEM: 0.3276, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2380, partial_loss/deprel_loss: 0.3630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5145, loss: 0.7950, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  92%|#########1| 102/111 [01:12<00:06,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9391, LAS: 0.8888, UEM: 0.5696, LEM: 0.3285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2042, partial_loss/deprel_loss: 0.3583, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5040, loss: 0.7909, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  95%|#########4| 105/111 [01:14<00:04,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8744, UAS: 0.9389, LAS: 0.8884, UEM: 0.5633, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7002, partial_loss/deprel_loss: 0.7096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8842, loss: 0.7945, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||:  98%|#########8| 109/111 [01:16<00:01,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8158, UAS: 0.9386, LAS: 0.8880, UEM: 0.5631, LEM: 0.3230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5034, partial_loss/deprel_loss: 1.0496, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3169, loss: 0.7973, batch_reg_loss: 0.1765, reg_loss: 0.1766 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     1.050  |       N/A\n",
      "2023-04-07 00:14:00,969 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.503  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.177  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - UEM                      |     0.563  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - LAS                      |     0.888  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - loss                     |     0.797  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - LEM                      |     0.323  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - UAS                      |     0.939  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - EM                       |     0.816  |       N/A\n",
      "2023-04-07 00:14:00,970 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:14:00,976 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:14:07,569 - INFO - combo.training.trainer - Epoch duration: 0:01:27.085147\n",
      "2023-04-07 00:14:07,569 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:46\n",
      "2023-04-07 00:14:07,570 - INFO - allennlp.training.trainer - Epoch 64/399\n",
      "2023-04-07 00:14:07,570 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:14:07,570 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:14:07,579 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9424, LAS: 0.8965, UEM: 0.7553, LEM: 0.5743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4184, partial_loss/deprel_loss: 0.5698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7159, loss: 0.7365, batch_reg_loss: 0.1765, reg_loss: 0.1765 ||:   3%|2         | 3/111 [00:02<01:20,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9456, LAS: 0.8991, UEM: 0.6562, LEM: 0.4308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4812, partial_loss/deprel_loss: 0.5967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7501, loss: 0.7251, batch_reg_loss: 0.1764, reg_loss: 0.1765 ||:   6%|6         | 7/111 [00:04<01:13,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9400, LAS: 0.8915, UEM: 0.5800, LEM: 0.3541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4154, partial_loss/deprel_loss: 0.5672, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7133, loss: 0.7932, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  10%|9         | 11/111 [00:07<01:10,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9398, LAS: 0.8908, UEM: 0.5572, LEM: 0.3242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3106, partial_loss/deprel_loss: 0.4770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6202, loss: 0.7940, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  13%|#2        | 14/111 [00:09<01:08,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9379, LAS: 0.8888, UEM: 0.5385, LEM: 0.3089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5457, partial_loss/deprel_loss: 0.6542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8089, loss: 0.8111, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  15%|#5        | 17/111 [00:11<01:07,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9404, LAS: 0.8915, UEM: 0.5680, LEM: 0.3306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2816, partial_loss/deprel_loss: 0.4403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 0.7857, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  18%|#8        | 20/111 [00:14<01:05,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.7952, UAS: 0.9377, LAS: 0.8885, UEM: 0.5705, LEM: 0.3313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 2.2371, partial_loss/deprel_loss: 1.3617, partial_loss/cycle_loss: 0.0000, batch_loss: 1.7132, loss: 0.8161, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  21%|##        | 23/111 [00:16<01:04,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9395, LAS: 0.8902, UEM: 0.5696, LEM: 0.3252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4209, partial_loss/deprel_loss: 0.4874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6505, loss: 0.8001, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9428, LAS: 0.8938, UEM: 0.6109, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2672, partial_loss/deprel_loss: 0.4811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.7724, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  26%|##6       | 29/111 [00:20<00:58,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8613, UAS: 0.9427, LAS: 0.8934, UEM: 0.6043, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8892, partial_loss/deprel_loss: 0.7627, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9644, loss: 0.7738, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  29%|##8       | 32/111 [00:22<00:55,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9429, LAS: 0.8938, UEM: 0.5867, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4316, partial_loss/deprel_loss: 0.5089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6698, loss: 0.7712, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  32%|###2      | 36/111 [00:25<00:51,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8462, UAS: 0.9414, LAS: 0.8917, UEM: 0.5679, LEM: 0.3216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9932, partial_loss/deprel_loss: 0.8972, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0928, loss: 0.7831, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  36%|###6      | 40/111 [00:27<00:46,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8222, UAS: 0.9402, LAS: 0.8901, UEM: 0.5609, LEM: 0.3142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4805, partial_loss/deprel_loss: 1.1199, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3684, loss: 0.7962, batch_reg_loss: 0.1764, reg_loss: 0.1764 ||:  40%|###9      | 44/111 [00:30<00:43,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9421, LAS: 0.8927, UEM: 0.5967, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2505, partial_loss/deprel_loss: 0.4069, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5520, loss: 0.7783, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  43%|####3     | 48/111 [00:33<00:44,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9430, LAS: 0.8937, UEM: 0.5972, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2783, partial_loss/deprel_loss: 0.5068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6374, loss: 0.7690, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  47%|####6     | 52/111 [00:36<00:41,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8687, UAS: 0.9428, LAS: 0.8935, UEM: 0.5909, LEM: 0.3517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7752, partial_loss/deprel_loss: 0.7210, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9082, loss: 0.7704, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  50%|#####     | 56/111 [00:38<00:37,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9439, LAS: 0.8947, UEM: 0.6005, LEM: 0.3591, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4300, partial_loss/deprel_loss: 0.4863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6514, loss: 0.7624, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  53%|#####3    | 59/111 [00:40<00:36,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8199, UAS: 0.9417, LAS: 0.8926, UEM: 0.5902, LEM: 0.3526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6636, partial_loss/deprel_loss: 0.9961, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3059, loss: 0.7789, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  56%|#####5    | 62/111 [00:42<00:33,  1.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9413, LAS: 0.8921, UEM: 0.5894, LEM: 0.3530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0166, partial_loss/deprel_loss: 0.8454, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0559, loss: 0.7818, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  59%|#####8    | 65/111 [00:45<00:32,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9409, LAS: 0.8915, UEM: 0.5879, LEM: 0.3506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2982, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5866, loss: 0.7857, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  61%|######1   | 68/111 [00:47<00:30,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9415, LAS: 0.8921, UEM: 0.5966, LEM: 0.3589, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7684, partial_loss/deprel_loss: 0.6968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8874, loss: 0.7806, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  64%|######3   | 71/111 [00:49<00:29,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9415, LAS: 0.8920, UEM: 0.5889, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3207, partial_loss/deprel_loss: 0.4941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6357, loss: 0.7809, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  68%|######7   | 75/111 [00:52<00:25,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8619, UAS: 0.9410, LAS: 0.8913, UEM: 0.5785, LEM: 0.3428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9618, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0183, loss: 0.7868, batch_reg_loss: 0.1763, reg_loss: 0.1764 ||:  71%|#######1  | 79/111 [00:54<00:20,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9413, LAS: 0.8918, UEM: 0.5854, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9237, partial_loss/deprel_loss: 0.8028, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0032, loss: 0.7828, batch_reg_loss: 0.1762, reg_loss: 0.1764 ||:  75%|#######4  | 83/111 [00:57<00:18,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9416, LAS: 0.8921, UEM: 0.5822, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3736, partial_loss/deprel_loss: 0.5020, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6526, loss: 0.7811, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  78%|#######8  | 87/111 [01:00<00:17,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9419, LAS: 0.8924, UEM: 0.5824, LEM: 0.3462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2289, partial_loss/deprel_loss: 0.3876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5321, loss: 0.7777, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  81%|########1 | 90/111 [01:02<00:15,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9424, LAS: 0.8931, UEM: 0.5877, LEM: 0.3496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3492, partial_loss/deprel_loss: 0.5226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6642, loss: 0.7721, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  84%|########3 | 93/111 [01:04<00:12,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9426, LAS: 0.8934, UEM: 0.5861, LEM: 0.3472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3260, partial_loss/deprel_loss: 0.4986, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.7709, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  87%|########7 | 97/111 [01:07<00:09,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8197, UAS: 0.9416, LAS: 0.8925, UEM: 0.5812, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8202, partial_loss/deprel_loss: 0.9301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2843, loss: 0.7767, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  91%|######### | 101/111 [01:09<00:06,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9417, LAS: 0.8925, UEM: 0.5748, LEM: 0.3369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5971, partial_loss/deprel_loss: 0.7558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9002, loss: 0.7791, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  95%|#########4| 105/111 [01:12<00:04,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.9416, LAS: 0.8923, UEM: 0.5710, LEM: 0.3332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7785, partial_loss/deprel_loss: 0.7124, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9018, loss: 0.7798, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||:  97%|#########7| 108/111 [01:14<00:02,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9410, LAS: 0.8915, UEM: 0.5651, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9154, partial_loss/deprel_loss: 0.8018, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0006, loss: 0.7854, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 100%|##########| 111/111 [01:16<00:00,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8549, UAS: 0.9410, LAS: 0.8915, UEM: 0.5651, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9154, partial_loss/deprel_loss: 0.8018, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0006, loss: 0.7854, batch_reg_loss: 0.1762, reg_loss: 0.1763 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.802  |       N/A\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.915  |       N/A\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.176  |       N/A\n",
      "2023-04-07 00:15:27,592 - INFO - combo.training.tensorboard_writer - UEM                      |     0.565  |       N/A\n",
      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - LAS                      |     0.892  |       N/A\n",
      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - loss                     |     0.785  |       N/A\n",
      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - LEM                      |     0.329  |       N/A\n",
      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - UAS                      |     0.941  |       N/A\n",
      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - EM                       |     0.855  |       N/A\n",
      "2023-04-07 00:15:27,593 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:15:27,598 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:15:34,868 - INFO - combo.training.trainer - Epoch duration: 0:01:27.298867\n",
      "2023-04-07 00:15:34,869 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:09\n",
      "2023-04-07 00:15:34,869 - INFO - allennlp.training.trainer - Epoch 65/399\n",
      "2023-04-07 00:15:34,869 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:15:34,869 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:15:34,876 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9188, UAS: 0.9502, LAS: 0.9006, UEM: 0.4792, LEM: 0.2152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3437, partial_loss/deprel_loss: 0.4806, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6294, loss: 0.7186, batch_reg_loss: 0.1762, reg_loss: 0.1762 ||:   3%|2         | 3/111 [00:02<01:17,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9285, LAS: 0.8794, UEM: 0.3964, LEM: 0.1731, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6617, partial_loss/deprel_loss: 0.5697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7642, loss: 0.8714, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:   5%|5         | 6/111 [00:04<01:15,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8855, UAS: 0.9329, LAS: 0.8837, UEM: 0.4081, LEM: 0.1828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5837, partial_loss/deprel_loss: 0.6297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7967, loss: 0.8328, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:   8%|8         | 9/111 [00:06<01:13,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8397, UAS: 0.9340, LAS: 0.8848, UEM: 0.4359, LEM: 0.2012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1888, partial_loss/deprel_loss: 0.8942, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1292, loss: 0.8237, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  12%|#1        | 13/111 [00:09<01:08,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9390, LAS: 0.8905, UEM: 0.5050, LEM: 0.2569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2596, partial_loss/deprel_loss: 0.3912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5410, loss: 0.7799, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  14%|#4        | 16/111 [00:11<01:07,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9417, LAS: 0.8939, UEM: 0.5398, LEM: 0.2875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4567, partial_loss/deprel_loss: 0.5314, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6926, loss: 0.7536, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  17%|#7        | 19/111 [00:13<01:06,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9426, LAS: 0.8944, UEM: 0.5453, LEM: 0.2903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5512, partial_loss/deprel_loss: 0.5817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7518, loss: 0.7517, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  20%|#9        | 22/111 [00:15<01:03,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8684, UAS: 0.9405, LAS: 0.8917, UEM: 0.5186, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9198, partial_loss/deprel_loss: 0.7851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9881, loss: 0.7773, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  23%|##2       | 25/111 [00:17<01:00,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9414, LAS: 0.8929, UEM: 0.5435, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3073, partial_loss/deprel_loss: 0.4587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6046, loss: 0.7677, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  25%|##5       | 28/111 [00:19<00:57,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9427, LAS: 0.8947, UEM: 0.5851, LEM: 0.3425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0904, partial_loss/deprel_loss: 0.2188, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3692, loss: 0.7532, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  28%|##7       | 31/111 [00:22<00:58,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9421, LAS: 0.8936, UEM: 0.5740, LEM: 0.3302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7529, partial_loss/deprel_loss: 0.8034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9694, loss: 0.7675, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  31%|###       | 34/111 [00:24<00:54,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9422, LAS: 0.8932, UEM: 0.5649, LEM: 0.3197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5704, partial_loss/deprel_loss: 0.6786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8331, loss: 0.7708, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  33%|###3      | 37/111 [00:26<00:52,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8517, UAS: 0.9389, LAS: 0.8896, UEM: 0.5482, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9369, partial_loss/deprel_loss: 0.8963, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0805, loss: 0.7991, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  36%|###6      | 40/111 [00:28<00:51,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9398, LAS: 0.8907, UEM: 0.5574, LEM: 0.3179, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2348, partial_loss/deprel_loss: 0.3746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5227, loss: 0.7898, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  39%|###8      | 43/111 [00:30<00:49,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9402, LAS: 0.8911, UEM: 0.5758, LEM: 0.3358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0961, partial_loss/deprel_loss: 0.3030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4377, loss: 0.7841, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  41%|####1     | 46/111 [00:33<00:48,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9412, LAS: 0.8924, UEM: 0.5791, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3451, partial_loss/deprel_loss: 0.4574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6110, loss: 0.7733, batch_reg_loss: 0.1761, reg_loss: 0.1761 ||:  44%|####4     | 49/111 [00:35<00:48,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8615, UAS: 0.9405, LAS: 0.8913, UEM: 0.5642, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9953, partial_loss/deprel_loss: 0.8299, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0390, loss: 0.7814, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  48%|####7     | 53/111 [00:38<00:42,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9404, LAS: 0.8914, UEM: 0.5579, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3034, partial_loss/deprel_loss: 0.4683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6113, loss: 0.7792, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  51%|#####1    | 57/111 [00:40<00:37,  1.43it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9410, LAS: 0.8922, UEM: 0.5655, LEM: 0.3256, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4643, partial_loss/deprel_loss: 0.6052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7531, loss: 0.7743, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  54%|#####4    | 60/111 [00:42<00:36,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9420, LAS: 0.8935, UEM: 0.5793, LEM: 0.3406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4151, partial_loss/deprel_loss: 0.4695, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6346, loss: 0.7633, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  57%|#####6    | 63/111 [00:45<00:35,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9420, LAS: 0.8940, UEM: 0.6043, LEM: 0.3750, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0402, partial_loss/deprel_loss: 0.1250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2840, loss: 0.7604, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  59%|#####9    | 66/111 [00:47<00:34,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9424, LAS: 0.8945, UEM: 0.6072, LEM: 0.3778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8798, partial_loss/deprel_loss: 0.7190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9271, loss: 0.7567, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  62%|######2   | 69/111 [00:50<00:32,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8730, UAS: 0.9417, LAS: 0.8937, UEM: 0.5964, LEM: 0.3689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9134, partial_loss/deprel_loss: 0.6988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9177, loss: 0.7623, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  66%|######5   | 73/111 [00:52<00:27,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8693, UAS: 0.9425, LAS: 0.8946, UEM: 0.6038, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8754, partial_loss/deprel_loss: 0.7352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9392, loss: 0.7569, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  69%|######9   | 77/111 [00:57<00:30,  1.13it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9430, LAS: 0.8949, UEM: 0.6048, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2401, partial_loss/deprel_loss: 0.4459, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5807, loss: 0.7545, batch_reg_loss: 0.1760, reg_loss: 0.1761 ||:  72%|#######2  | 80/111 [01:00<00:26,  1.16it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8322, UAS: 0.9423, LAS: 0.8940, UEM: 0.6014, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3299, partial_loss/deprel_loss: 1.0192, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2573, loss: 0.7618, batch_reg_loss: 0.1759, reg_loss: 0.1761 ||:  75%|#######4  | 83/111 [01:02<00:22,  1.24it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8742, UAS: 0.9428, LAS: 0.8945, UEM: 0.6022, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8188, partial_loss/deprel_loss: 0.7814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9648, loss: 0.7589, batch_reg_loss: 0.1759, reg_loss: 0.1761 ||:  78%|#######8  | 87/111 [01:04<00:18,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9432, LAS: 0.8950, UEM: 0.6033, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4792, partial_loss/deprel_loss: 0.5202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.7550, batch_reg_loss: 0.1759, reg_loss: 0.1761 ||:  81%|########1 | 90/111 [01:06<00:15,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8641, UAS: 0.9432, LAS: 0.8948, UEM: 0.5973, LEM: 0.3630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7809, partial_loss/deprel_loss: 0.8364, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0012, loss: 0.7570, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||:  85%|########4 | 94/111 [01:09<00:12,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8751, UAS: 0.9430, LAS: 0.8947, UEM: 0.5933, LEM: 0.3590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0805, partial_loss/deprel_loss: 0.7475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9900, loss: 0.7587, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||:  87%|########7 | 97/111 [01:11<00:09,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8796, UAS: 0.9429, LAS: 0.8944, UEM: 0.5915, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6612, partial_loss/deprel_loss: 0.7524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9101, loss: 0.7615, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||:  91%|######### | 101/111 [01:14<00:06,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8512, UAS: 0.9425, LAS: 0.8939, UEM: 0.5845, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2449, partial_loss/deprel_loss: 0.8082, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0714, loss: 0.7650, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||:  95%|#########4| 105/111 [01:16<00:03,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9423, LAS: 0.8940, UEM: 0.5795, LEM: 0.3461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3786, partial_loss/deprel_loss: 0.4375, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6016, loss: 0.7645, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||:  98%|#########8| 109/111 [01:18<00:01,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9422, LAS: 0.8938, UEM: 0.5751, LEM: 0.3426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6651, partial_loss/deprel_loss: 0.6879, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8592, loss: 0.7658, batch_reg_loss: 0.1759, reg_loss: 0.1760 ||: 100%|##########| 111/111 [01:20<00:00,  1.39it/s]\n",
      "2023-04-07 00:16:58,127 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9622, LAS: 0.9118, UEM: 0.7073, LEM: 0.3706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5903, partial_loss/deprel_loss: 24.2431, partial_loss/cycle_loss: 0.0000, batch_loss: 19.5125, loss: 18.2181, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.02it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9523, LAS: 0.9049, UEM: 0.7137, LEM: 0.4660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2693, partial_loss/deprel_loss: 48.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 38.9773, loss: 22.4714, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.02it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9472, LAS: 0.8970, UEM: 0.6454, LEM: 0.3894, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1023, partial_loss/deprel_loss: 43.3819, partial_loss/cycle_loss: 0.0000, batch_loss: 34.9260, loss: 24.5970, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9499, LAS: 0.8993, UEM: 0.6645, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4265, partial_loss/deprel_loss: 24.5629, partial_loss/cycle_loss: 0.0000, batch_loss: 19.7356, loss: 24.1319, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.02it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8269, UAS: 0.9448, LAS: 0.8937, UEM: 0.6475, LEM: 0.3805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6012, partial_loss/deprel_loss: 57.6302, partial_loss/cycle_loss: 0.0000, batch_loss: 46.4244, loss: 25.8467, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.01it/s]\n",
      "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:17:10,952 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.688  |    57.630\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.665  |     1.601\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.176  |     0.000\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - UEM                      |     0.575  |     0.648\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - LAS                      |     0.894  |     0.894\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - loss                     |     0.766  |    25.847\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - LEM                      |     0.343  |     0.381\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - UAS                      |     0.942  |     0.945\n",
      "2023-04-07 00:17:10,953 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:17:10,954 - INFO - combo.training.tensorboard_writer - EM                       |     0.883  |     0.827\n",
      "2023-04-07 00:17:10,954 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:17:10,958 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:17:15,921 - INFO - combo.training.trainer - Epoch duration: 0:01:41.052355\n",
      "2023-04-07 00:17:15,922 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:41\n",
      "2023-04-07 00:17:15,928 - INFO - allennlp.training.trainer - Epoch 66/399\n",
      "2023-04-07 00:17:15,930 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:17:15,930 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:17:15,938 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9503, LAS: 0.9045, UEM: 0.6977, LEM: 0.5070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1065, partial_loss/deprel_loss: 0.2698, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4130, loss: 0.6921, batch_reg_loss: 0.1759, reg_loss: 0.1759 ||:   3%|2         | 3/111 [00:02<01:20,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8694, UAS: 0.9330, LAS: 0.8820, UEM: 0.5288, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8724, partial_loss/deprel_loss: 0.7974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9882, loss: 0.8708, batch_reg_loss: 0.1759, reg_loss: 0.1759 ||:   6%|6         | 7/111 [00:04<01:13,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9319, LAS: 0.8828, UEM: 0.4824, LEM: 0.2958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5042, partial_loss/deprel_loss: 0.6965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8339, loss: 0.8558, batch_reg_loss: 0.1758, reg_loss: 0.1759 ||:  10%|9         | 11/111 [00:07<01:08,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9382, LAS: 0.8904, UEM: 0.5645, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2334, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4984, loss: 0.7947, batch_reg_loss: 0.1758, reg_loss: 0.1759 ||:  13%|#2        | 14/111 [00:09<01:08,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8779, UAS: 0.9392, LAS: 0.8913, UEM: 0.5810, LEM: 0.3711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7095, partial_loss/deprel_loss: 0.7485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9165, loss: 0.7856, batch_reg_loss: 0.1758, reg_loss: 0.1759 ||:  15%|#5        | 17/111 [00:11<01:06,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9393, LAS: 0.8918, UEM: 0.5778, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2544, partial_loss/deprel_loss: 0.3554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5111, loss: 0.7788, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  18%|#8        | 20/111 [00:13<01:06,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9420, LAS: 0.8949, UEM: 0.5900, LEM: 0.3719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2620, partial_loss/deprel_loss: 0.4336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5751, loss: 0.7566, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  21%|##        | 23/111 [00:16<01:04,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8643, UAS: 0.9413, LAS: 0.8942, UEM: 0.5750, LEM: 0.3566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0092, partial_loss/deprel_loss: 0.7582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9842, loss: 0.7636, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  23%|##3       | 26/111 [00:18<01:02,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9425, LAS: 0.8950, UEM: 0.5722, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6922, partial_loss/deprel_loss: 0.7588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9213, loss: 0.7595, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  26%|##6       | 29/111 [00:20<00:58,  1.40it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9426, LAS: 0.8947, UEM: 0.5539, LEM: 0.3315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5699, partial_loss/deprel_loss: 0.6186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7846, loss: 0.7658, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  30%|##9       | 33/111 [00:22<00:54,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8579, UAS: 0.9409, LAS: 0.8928, UEM: 0.5364, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2077, partial_loss/deprel_loss: 0.7697, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0331, loss: 0.7801, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  32%|###2      | 36/111 [00:25<00:53,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9417, LAS: 0.8936, UEM: 0.5383, LEM: 0.3137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6008, partial_loss/deprel_loss: 0.6349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8038, loss: 0.7737, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  35%|###5      | 39/111 [00:27<00:50,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9419, LAS: 0.8937, UEM: 0.5330, LEM: 0.3057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7104, partial_loss/deprel_loss: 0.6737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8568, loss: 0.7698, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  39%|###8      | 43/111 [00:30<00:47,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9002, UAS: 0.9435, LAS: 0.8958, UEM: 0.5762, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4251, partial_loss/deprel_loss: 0.5221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6784, loss: 0.7536, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  41%|####1     | 46/111 [00:32<00:49,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9450, LAS: 0.8975, UEM: 0.6032, LEM: 0.3863, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1083, partial_loss/deprel_loss: 0.2278, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3797, loss: 0.7388, batch_reg_loss: 0.1758, reg_loss: 0.1758 ||:  44%|####4     | 49/111 [00:35<00:50,  1.22it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8851, UAS: 0.9446, LAS: 0.8970, UEM: 0.5923, LEM: 0.3751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5940, partial_loss/deprel_loss: 0.6613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8236, loss: 0.7427, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  47%|####6     | 52/111 [00:37<00:46,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8753, UAS: 0.9449, LAS: 0.8972, UEM: 0.5905, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9129, partial_loss/deprel_loss: 0.7567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9636, loss: 0.7413, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  50%|#####     | 56/111 [00:40<00:40,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9460, LAS: 0.8985, UEM: 0.6008, LEM: 0.3761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2598, partial_loss/deprel_loss: 0.4018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5491, loss: 0.7311, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  53%|#####3    | 59/111 [00:42<00:38,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8576, UAS: 0.9449, LAS: 0.8970, UEM: 0.5994, LEM: 0.3741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9877, partial_loss/deprel_loss: 0.8369, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0427, loss: 0.7406, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  56%|#####5    | 62/111 [00:44<00:36,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8152, UAS: 0.9420, LAS: 0.8940, UEM: 0.5910, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7323, partial_loss/deprel_loss: 0.9653, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2944, loss: 0.7644, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  59%|#####8    | 65/111 [00:46<00:33,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9423, LAS: 0.8944, UEM: 0.5933, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1783, partial_loss/deprel_loss: 0.3056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4558, loss: 0.7605, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  61%|######1   | 68/111 [00:49<00:31,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9416, LAS: 0.8937, UEM: 0.5844, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5059, partial_loss/deprel_loss: 0.5656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7293, loss: 0.7655, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  65%|######4   | 72/111 [00:51<00:27,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9416, LAS: 0.8939, UEM: 0.5826, LEM: 0.3602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8336, partial_loss/deprel_loss: 0.6601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8705, loss: 0.7631, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  68%|######7   | 75/111 [00:53<00:25,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9426, LAS: 0.8951, UEM: 0.5931, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2431, partial_loss/deprel_loss: 0.3982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5429, loss: 0.7539, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  70%|#######   | 78/111 [00:56<00:24,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9429, LAS: 0.8955, UEM: 0.5893, LEM: 0.3641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6002, partial_loss/deprel_loss: 0.7296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8794, loss: 0.7525, batch_reg_loss: 0.1757, reg_loss: 0.1758 ||:  74%|#######3  | 82/111 [00:58<00:20,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9429, LAS: 0.8955, UEM: 0.5864, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3258, partial_loss/deprel_loss: 0.4505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6012, loss: 0.7537, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||:  77%|#######6  | 85/111 [01:00<00:18,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9425, LAS: 0.8951, UEM: 0.5812, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7507, partial_loss/deprel_loss: 0.7151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8979, loss: 0.7580, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||:  79%|#######9  | 88/111 [01:02<00:16,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9421, LAS: 0.8945, UEM: 0.5720, LEM: 0.3474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5785, partial_loss/deprel_loss: 0.6467, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8087, loss: 0.7620, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||:  83%|########2 | 92/111 [01:05<00:13,  1.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9420, LAS: 0.8944, UEM: 0.5703, LEM: 0.3458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2231, partial_loss/deprel_loss: 0.4463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5773, loss: 0.7642, batch_reg_loss: 0.1756, reg_loss: 0.1758 ||:  86%|########5 | 95/111 [01:07<00:11,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9420, LAS: 0.8944, UEM: 0.5656, LEM: 0.3414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3783, partial_loss/deprel_loss: 0.4944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6468, loss: 0.7654, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||:  88%|########8 | 98/111 [01:09<00:09,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9425, LAS: 0.8950, UEM: 0.5688, LEM: 0.3418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2546, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5528, loss: 0.7615, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||:  91%|######### | 101/111 [01:12<00:07,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8398, UAS: 0.9421, LAS: 0.8945, UEM: 0.5678, LEM: 0.3398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2186, partial_loss/deprel_loss: 0.9452, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1755, loss: 0.7646, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||:  95%|#########4| 105/111 [01:14<00:04,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8529, UAS: 0.9422, LAS: 0.8945, UEM: 0.5710, LEM: 0.3428, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1337, partial_loss/deprel_loss: 0.8690, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0975, loss: 0.7643, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||:  97%|#########7| 108/111 [01:16<00:02,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9424, LAS: 0.8947, UEM: 0.5696, LEM: 0.3410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4207, partial_loss/deprel_loss: 0.5379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6900, loss: 0.7623, batch_reg_loss: 0.1756, reg_loss: 0.1757 ||: 100%|##########| 111/111 [01:18<00:00,  1.41it/s]\n",
      "2023-04-07 00:18:37,817 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.538  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.421  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.176  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - UEM                      |     0.570  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - LAS                      |     0.895  |       N/A\n",
      "2023-04-07 00:18:37,818 - INFO - combo.training.tensorboard_writer - loss                     |     0.762  |       N/A\n",
      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - LEM                      |     0.341  |       N/A\n",
      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - UAS                      |     0.942  |       N/A\n",
      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - EM                       |     0.905  |       N/A\n",
      "2023-04-07 00:18:37,819 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:18:37,824 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:18:43,756 - INFO - combo.training.trainer - Epoch duration: 0:01:27.828285\n",
      "2023-04-07 00:18:43,756 - INFO - combo.training.trainer - Estimated training time remaining: 7:22:02\n",
      "2023-04-07 00:18:43,756 - INFO - allennlp.training.trainer - Epoch 67/399\n",
      "2023-04-07 00:18:43,756 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:18:43,757 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:18:43,764 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9642, LAS: 0.9136, UEM: 0.7103, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4133, partial_loss/deprel_loss: 0.5074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6642, loss: 0.5930, batch_reg_loss: 0.1756, reg_loss: 0.1756 ||:   3%|2         | 3/111 [00:02<01:17,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9569, LAS: 0.9091, UEM: 0.6867, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8104, partial_loss/deprel_loss: 0.7143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9091, loss: 0.6318, batch_reg_loss: 0.1756, reg_loss: 0.1756 ||:   5%|5         | 6/111 [00:04<01:15,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8706, UAS: 0.9488, LAS: 0.9010, UEM: 0.6200, LEM: 0.3721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8166, partial_loss/deprel_loss: 0.7593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9463, loss: 0.6963, batch_reg_loss: 0.1756, reg_loss: 0.1756 ||:   8%|8         | 9/111 [00:06<01:11,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9508, LAS: 0.9041, UEM: 0.6444, LEM: 0.3996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5798, partial_loss/deprel_loss: 0.5682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7461, loss: 0.6720, batch_reg_loss: 0.1755, reg_loss: 0.1756 ||:  11%|#         | 12/111 [00:08<01:12,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8375, UAS: 0.9467, LAS: 0.8998, UEM: 0.6254, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4919, partial_loss/deprel_loss: 0.8657, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1665, loss: 0.7057, batch_reg_loss: 0.1755, reg_loss: 0.1756 ||:  14%|#3        | 15/111 [00:10<01:10,  1.36it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9469, LAS: 0.8998, UEM: 0.6047, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5035, partial_loss/deprel_loss: 0.5987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7551, loss: 0.7078, batch_reg_loss: 0.1755, reg_loss: 0.1756 ||:  16%|#6        | 18/111 [00:12<01:06,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9442, LAS: 0.8963, UEM: 0.5739, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7310, partial_loss/deprel_loss: 0.7217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8991, loss: 0.7291, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  20%|#9        | 22/111 [00:15<01:01,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9430, LAS: 0.8945, UEM: 0.5612, LEM: 0.3196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3415, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6500, loss: 0.7442, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  23%|##3       | 26/111 [00:18<00:57,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8734, UAS: 0.9418, LAS: 0.8931, UEM: 0.5430, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8382, partial_loss/deprel_loss: 0.7788, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9661, loss: 0.7568, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  26%|##6       | 29/111 [00:20<00:56,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9410, LAS: 0.8926, UEM: 0.5419, LEM: 0.3050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1855, partial_loss/deprel_loss: 0.3591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4999, loss: 0.7624, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  29%|##8       | 32/111 [00:22<00:54,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9414, LAS: 0.8931, UEM: 0.5294, LEM: 0.2942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 0.4967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.7629, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  32%|###2      | 36/111 [00:24<00:50,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9408, LAS: 0.8920, UEM: 0.5319, LEM: 0.2971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2387, partial_loss/deprel_loss: 0.4094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5507, loss: 0.7721, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  35%|###5      | 39/111 [00:27<00:50,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9387, LAS: 0.8896, UEM: 0.5138, LEM: 0.2844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7333, partial_loss/deprel_loss: 0.7696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9378, loss: 0.7934, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  39%|###8      | 43/111 [00:29<00:46,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9402, LAS: 0.8909, UEM: 0.5172, LEM: 0.2789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4004, partial_loss/deprel_loss: 0.5476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6936, loss: 0.7838, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  42%|####2     | 47/111 [00:32<00:41,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9420, LAS: 0.8928, UEM: 0.5398, LEM: 0.2949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2967, partial_loss/deprel_loss: 0.4850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6228, loss: 0.7686, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  46%|####5     | 51/111 [00:34<00:40,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8131, UAS: 0.9405, LAS: 0.8912, UEM: 0.5303, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9220, partial_loss/deprel_loss: 1.1761, partial_loss/cycle_loss: 0.0000, batch_loss: 1.5007, loss: 0.7840, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  49%|####8     | 54/111 [00:37<00:38,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9656, UAS: 0.9420, LAS: 0.8931, UEM: 0.5650, LEM: 0.3310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0461, partial_loss/deprel_loss: 0.1304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2890, loss: 0.7724, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  51%|#####1    | 57/111 [00:39<00:40,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9416, LAS: 0.8928, UEM: 0.5562, LEM: 0.3234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6266, partial_loss/deprel_loss: 0.6746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8405, loss: 0.7761, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  55%|#####4    | 61/111 [00:42<00:35,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8867, UAS: 0.9413, LAS: 0.8928, UEM: 0.5574, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8080, partial_loss/deprel_loss: 0.7247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9168, loss: 0.7787, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  58%|#####7    | 64/111 [00:44<00:33,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9412, LAS: 0.8928, UEM: 0.5553, LEM: 0.3234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2988, partial_loss/deprel_loss: 0.4409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5880, loss: 0.7789, batch_reg_loss: 0.1755, reg_loss: 0.1755 ||:  61%|######1   | 68/111 [00:46<00:29,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9407, LAS: 0.8924, UEM: 0.5512, LEM: 0.3204, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4814, partial_loss/deprel_loss: 0.5985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7505, loss: 0.7839, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  65%|######4   | 72/111 [00:49<00:26,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9412, LAS: 0.8931, UEM: 0.5510, LEM: 0.3184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2814, partial_loss/deprel_loss: 0.3595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5193, loss: 0.7792, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  68%|######8   | 76/111 [00:51<00:22,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9425, LAS: 0.8948, UEM: 0.5767, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1161, partial_loss/deprel_loss: 0.2586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4055, loss: 0.7664, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  72%|#######2  | 80/111 [00:54<00:21,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8449, UAS: 0.9419, LAS: 0.8942, UEM: 0.5766, LEM: 0.3485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3649, partial_loss/deprel_loss: 0.9268, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1898, loss: 0.7712, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  76%|#######5  | 84/111 [00:57<00:18,  1.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8738, UAS: 0.9419, LAS: 0.8943, UEM: 0.5731, LEM: 0.3455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8962, partial_loss/deprel_loss: 0.7475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9527, loss: 0.7723, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  79%|#######9  | 88/111 [01:00<00:15,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9417, LAS: 0.8942, UEM: 0.5688, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0678, partial_loss/deprel_loss: 0.7556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9934, loss: 0.7736, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  83%|########2 | 92/111 [01:02<00:12,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9423, LAS: 0.8947, UEM: 0.5730, LEM: 0.3437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3825, partial_loss/deprel_loss: 0.4802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6360, loss: 0.7677, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  86%|########5 | 95/111 [01:05<00:11,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8799, UAS: 0.9423, LAS: 0.8947, UEM: 0.5699, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6675, partial_loss/deprel_loss: 0.6876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8590, loss: 0.7672, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  88%|########8 | 98/111 [01:07<00:09,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9425, LAS: 0.8949, UEM: 0.5694, LEM: 0.3394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4298, partial_loss/deprel_loss: 0.5523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7032, loss: 0.7656, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  91%|######### | 101/111 [01:09<00:07,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9427, LAS: 0.8950, UEM: 0.5679, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8124, partial_loss/deprel_loss: 0.7865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9671, loss: 0.7648, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  94%|#########3| 104/111 [01:12<00:05,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8479, UAS: 0.9427, LAS: 0.8950, UEM: 0.5721, LEM: 0.3398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1232, partial_loss/deprel_loss: 0.8301, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0640, loss: 0.7638, batch_reg_loss: 0.1754, reg_loss: 0.1755 ||:  96%|#########6| 107/111 [01:14<00:02,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9429, LAS: 0.8952, UEM: 0.5712, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4432, partial_loss/deprel_loss: 0.5331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6905, loss: 0.7619, batch_reg_loss: 0.1753, reg_loss: 0.1755 ||: 100%|##########| 111/111 [01:16<00:00,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9429, LAS: 0.8952, UEM: 0.5712, LEM: 0.3392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4432, partial_loss/deprel_loss: 0.5331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6905, loss: 0.7619, batch_reg_loss: 0.1753, reg_loss: 0.1755 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:20:03,747 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.533  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.443  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.175  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - UEM                      |     0.571  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - LAS                      |     0.895  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - loss                     |     0.762  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - LEM                      |     0.339  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - UAS                      |     0.943  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - EM                       |     0.898  |       N/A\n",
      "2023-04-07 00:20:03,748 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:20:03,753 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:20:08,702 - INFO - combo.training.trainer - Epoch duration: 0:01:24.945331\n",
      "2023-04-07 00:20:08,702 - INFO - combo.training.trainer - Estimated training time remaining: 7:21:09\n",
      "2023-04-07 00:20:08,702 - INFO - allennlp.training.trainer - Epoch 68/399\n",
      "2023-04-07 00:20:08,703 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:20:08,703 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:20:08,712 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9535, LAS: 0.9120, UEM: 0.6017, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3017, partial_loss/deprel_loss: 0.4315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5809, loss: 0.6322, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:   4%|3         | 4/111 [00:02<01:05,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8080, UAS: 0.9387, LAS: 0.8935, UEM: 0.5898, LEM: 0.3554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.9282, partial_loss/deprel_loss: 1.0957, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4375, loss: 0.7649, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:   7%|7         | 8/111 [00:05<01:05,  1.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9419, LAS: 0.8966, UEM: 0.6199, LEM: 0.3896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1184, partial_loss/deprel_loss: 0.2622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4087, loss: 0.7419, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  10%|9         | 11/111 [00:07<01:07,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8727, UAS: 0.9371, LAS: 0.8921, UEM: 0.6124, LEM: 0.3958, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9503, partial_loss/deprel_loss: 0.7199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9412, loss: 0.7698, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  13%|#2        | 14/111 [00:09<01:07,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8850, UAS: 0.9398, LAS: 0.8943, UEM: 0.5887, LEM: 0.3609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6932, partial_loss/deprel_loss: 0.7136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8848, loss: 0.7637, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  16%|#6        | 18/111 [00:11<01:01,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9050, UAS: 0.9373, LAS: 0.8906, UEM: 0.5553, LEM: 0.3335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4083, partial_loss/deprel_loss: 0.5014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6580, loss: 0.7922, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  20%|#9        | 22/111 [00:14<00:57,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9363, LAS: 0.8891, UEM: 0.5288, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6937, partial_loss/deprel_loss: 0.7187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8890, loss: 0.8091, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  23%|##3       | 26/111 [00:16<00:52,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9373, LAS: 0.8901, UEM: 0.5235, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3720, partial_loss/deprel_loss: 0.4579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6160, loss: 0.7941, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  27%|##7       | 30/111 [00:19<00:50,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8641, UAS: 0.9370, LAS: 0.8900, UEM: 0.5187, LEM: 0.3013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1057, partial_loss/deprel_loss: 0.7296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9801, loss: 0.7943, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  31%|###       | 34/111 [00:21<00:46,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9386, LAS: 0.8917, UEM: 0.5275, LEM: 0.3025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2765, partial_loss/deprel_loss: 0.3947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5464, loss: 0.7792, batch_reg_loss: 0.1753, reg_loss: 0.1753 ||:  34%|###4      | 38/111 [00:24<00:45,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9375, LAS: 0.8906, UEM: 0.5236, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2414, partial_loss/deprel_loss: 0.3580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5099, loss: 0.7878, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  38%|###7      | 42/111 [00:26<00:44,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9376, LAS: 0.8906, UEM: 0.5201, LEM: 0.2961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4612, partial_loss/deprel_loss: 0.5141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6788, loss: 0.7886, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  41%|####1     | 46/111 [00:30<00:44,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9371, LAS: 0.8898, UEM: 0.5100, LEM: 0.2858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8646, partial_loss/deprel_loss: 0.7190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9233, loss: 0.7953, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  45%|####5     | 50/111 [00:32<00:40,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9379, LAS: 0.8905, UEM: 0.5044, LEM: 0.2793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3146, partial_loss/deprel_loss: 0.5010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.7904, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  49%|####8     | 54/111 [00:35<00:37,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9390, LAS: 0.8916, UEM: 0.5100, LEM: 0.2795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7704, partial_loss/deprel_loss: 0.6965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8865, loss: 0.7837, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  52%|#####2    | 58/111 [00:37<00:34,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9404, LAS: 0.8931, UEM: 0.5284, LEM: 0.2965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2296, partial_loss/deprel_loss: 0.3919, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5346, loss: 0.7733, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  56%|#####5    | 62/111 [00:40<00:33,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8702, UAS: 0.9407, LAS: 0.8932, UEM: 0.5270, LEM: 0.2935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9076, partial_loss/deprel_loss: 0.7910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9895, loss: 0.7728, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  59%|#####8    | 65/111 [00:42<00:31,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9411, LAS: 0.8936, UEM: 0.5325, LEM: 0.3001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7607, partial_loss/deprel_loss: 0.6914, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8805, loss: 0.7690, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  61%|######1   | 68/111 [00:45<00:31,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9413, LAS: 0.8941, UEM: 0.5542, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8555, partial_loss/deprel_loss: 0.7473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9442, loss: 0.7660, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  64%|######3   | 71/111 [00:47<00:30,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9424, LAS: 0.8953, UEM: 0.5672, LEM: 0.3410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2020, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5146, loss: 0.7573, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  67%|######6   | 74/111 [00:49<00:27,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9429, LAS: 0.8959, UEM: 0.5668, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3585, partial_loss/deprel_loss: 0.4436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6018, loss: 0.7541, batch_reg_loss: 0.1752, reg_loss: 0.1753 ||:  69%|######9   | 77/111 [00:52<00:25,  1.33it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9430, LAS: 0.8959, UEM: 0.5699, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3904, partial_loss/deprel_loss: 0.5182, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6678, loss: 0.7540, batch_reg_loss: 0.1752, reg_loss: 0.1752 ||:  72%|#######2  | 80/111 [00:54<00:23,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9431, LAS: 0.8959, UEM: 0.5689, LEM: 0.3386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7975, partial_loss/deprel_loss: 0.6776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8768, loss: 0.7528, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  76%|#######5  | 84/111 [00:57<00:19,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9435, LAS: 0.8963, UEM: 0.5747, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4846, partial_loss/deprel_loss: 0.5977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7502, loss: 0.7493, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  78%|#######8  | 87/111 [00:59<00:17,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9434, LAS: 0.8962, UEM: 0.5679, LEM: 0.3372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4348, partial_loss/deprel_loss: 0.5119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6716, loss: 0.7515, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  82%|########1 | 91/111 [01:01<00:13,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9430, LAS: 0.8956, UEM: 0.5675, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3792, partial_loss/deprel_loss: 0.5264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6721, loss: 0.7560, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  86%|########5 | 95/111 [01:04<00:10,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8835, UAS: 0.9425, LAS: 0.8951, UEM: 0.5604, LEM: 0.3317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6581, partial_loss/deprel_loss: 0.6357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8153, loss: 0.7601, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  88%|########8 | 98/111 [01:06<00:09,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9430, LAS: 0.8956, UEM: 0.5657, LEM: 0.3356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2269, partial_loss/deprel_loss: 0.3150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4725, loss: 0.7555, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  91%|######### | 101/111 [01:09<00:07,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9042, UAS: 0.9434, LAS: 0.8958, UEM: 0.5635, LEM: 0.3316, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3605, partial_loss/deprel_loss: 0.6125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7372, loss: 0.7544, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  94%|#########3| 104/111 [01:11<00:05,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9443, LAS: 0.8970, UEM: 0.5796, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1041, partial_loss/deprel_loss: 0.2231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3744, loss: 0.7458, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||:  97%|#########7| 108/111 [01:14<00:02,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9443, LAS: 0.8969, UEM: 0.5791, LEM: 0.3471, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1234, partial_loss/deprel_loss: 0.8039, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0429, loss: 0.7461, batch_reg_loss: 0.1751, reg_loss: 0.1752 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:21:27,338 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.804  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.123  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.175  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - UEM                      |     0.579  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - LAS                      |     0.897  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - loss                     |     0.746  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - LEM                      |     0.347  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - UAS                      |     0.944  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - EM                       |     0.867  |       N/A\n",
      "2023-04-07 00:21:27,339 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:21:27,343 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:21:31,579 - INFO - combo.training.trainer - Epoch duration: 0:01:22.876591\n",
      "2023-04-07 00:21:31,579 - INFO - combo.training.trainer - Estimated training time remaining: 7:20:04\n",
      "2023-04-07 00:21:31,580 - INFO - allennlp.training.trainer - Epoch 69/399\n",
      "2023-04-07 00:21:31,580 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:21:31,580 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:21:31,588 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9372, LAS: 0.8856, UEM: 0.3389, LEM: 0.1217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4732, partial_loss/deprel_loss: 0.4556, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6342, loss: 0.8309, batch_reg_loss: 0.1751, reg_loss: 0.1751 ||:   4%|3         | 4/111 [00:02<01:07,  1.59it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9488, LAS: 0.9004, UEM: 0.5510, LEM: 0.2977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2803, partial_loss/deprel_loss: 0.4075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5571, loss: 0.7200, batch_reg_loss: 0.1750, reg_loss: 0.1751 ||:   7%|7         | 8/111 [00:04<01:02,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9457, LAS: 0.8972, UEM: 0.5200, LEM: 0.2623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4084, partial_loss/deprel_loss: 0.4927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6509, loss: 0.7452, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  11%|#         | 12/111 [00:07<01:01,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8633, UAS: 0.9434, LAS: 0.8948, UEM: 0.5249, LEM: 0.2788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9379, partial_loss/deprel_loss: 0.8857, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0712, loss: 0.7653, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  14%|#3        | 15/111 [00:09<01:02,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9402, LAS: 0.8918, UEM: 0.5390, LEM: 0.2953, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2273, partial_loss/deprel_loss: 0.3256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4810, loss: 0.7944, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  16%|#6        | 18/111 [00:11<01:03,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9430, LAS: 0.8945, UEM: 0.5717, LEM: 0.3261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3787, partial_loss/deprel_loss: 0.5596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6984, loss: 0.7723, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  19%|#8        | 21/111 [00:14<01:02,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8528, UAS: 0.9404, LAS: 0.8918, UEM: 0.5454, LEM: 0.3059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2247, partial_loss/deprel_loss: 0.8758, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1205, loss: 0.7921, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  22%|##1       | 24/111 [00:16<01:00,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8304, UAS: 0.9382, LAS: 0.8897, UEM: 0.5276, LEM: 0.2917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6034, partial_loss/deprel_loss: 0.8647, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1875, loss: 0.8006, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  24%|##4       | 27/111 [00:18<00:58,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9380, LAS: 0.8899, UEM: 0.5353, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2211, partial_loss/deprel_loss: 0.3530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5016, loss: 0.8007, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  27%|##7       | 30/111 [00:20<00:59,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9380, LAS: 0.8903, UEM: 0.5375, LEM: 0.3127, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5019, loss: 0.7981, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  30%|##9       | 33/111 [00:22<00:57,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9395, LAS: 0.8919, UEM: 0.5439, LEM: 0.3135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5803, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 0.7799, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  33%|###3      | 37/111 [00:25<00:52,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9400, LAS: 0.8925, UEM: 0.5530, LEM: 0.3207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3376, partial_loss/deprel_loss: 0.4714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6196, loss: 0.7748, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  37%|###6      | 41/111 [00:28<00:49,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9632, UAS: 0.9408, LAS: 0.8937, UEM: 0.5844, LEM: 0.3672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0568, partial_loss/deprel_loss: 0.1404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2986, loss: 0.7665, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  40%|###9      | 44/111 [00:30<00:49,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9411, LAS: 0.8936, UEM: 0.5783, LEM: 0.3588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2504, partial_loss/deprel_loss: 0.4800, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6091, loss: 0.7676, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  42%|####2     | 47/111 [00:32<00:45,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8815, UAS: 0.9419, LAS: 0.8945, UEM: 0.5785, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6921, partial_loss/deprel_loss: 0.7226, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8914, loss: 0.7608, batch_reg_loss: 0.1750, reg_loss: 0.1750 ||:  46%|####5     | 51/111 [00:35<00:41,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9407, LAS: 0.8931, UEM: 0.5619, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9564, partial_loss/deprel_loss: 0.7671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9799, loss: 0.7714, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  50%|####9     | 55/111 [00:37<00:38,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9407, LAS: 0.8932, UEM: 0.5584, LEM: 0.3364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5583, partial_loss/deprel_loss: 0.5483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7253, loss: 0.7697, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  53%|#####3    | 59/111 [00:40<00:34,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8819, UAS: 0.9405, LAS: 0.8928, UEM: 0.5496, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7194, partial_loss/deprel_loss: 0.7566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9240, loss: 0.7737, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  57%|#####6    | 63/111 [00:43<00:31,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9013, UAS: 0.9410, LAS: 0.8932, UEM: 0.5453, LEM: 0.3202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4204, partial_loss/deprel_loss: 0.5264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6801, loss: 0.7715, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  60%|######    | 67/111 [00:45<00:27,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9418, LAS: 0.8937, UEM: 0.5471, LEM: 0.3167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3232, partial_loss/deprel_loss: 0.4991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6388, loss: 0.7663, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  64%|######3   | 71/111 [00:48<00:26,  1.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8778, UAS: 0.9413, LAS: 0.8930, UEM: 0.5375, LEM: 0.3083, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7553, partial_loss/deprel_loss: 0.7453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9222, loss: 0.7724, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  68%|######7   | 75/111 [00:51<00:24,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9418, LAS: 0.8934, UEM: 0.5385, LEM: 0.3074, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5953, partial_loss/deprel_loss: 0.6810, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8388, loss: 0.7695, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  70%|#######   | 78/111 [00:53<00:24,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9427, LAS: 0.8946, UEM: 0.5573, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2803, partial_loss/deprel_loss: 0.4075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5569, loss: 0.7609, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  73%|#######2  | 81/111 [00:55<00:21,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8745, UAS: 0.9429, LAS: 0.8948, UEM: 0.5602, LEM: 0.3283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8755, partial_loss/deprel_loss: 0.6715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8872, loss: 0.7592, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  76%|#######5  | 84/111 [00:58<00:19,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9429, LAS: 0.8950, UEM: 0.5685, LEM: 0.3388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2962, partial_loss/deprel_loss: 0.4650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6061, loss: 0.7592, batch_reg_loss: 0.1749, reg_loss: 0.1750 ||:  78%|#######8  | 87/111 [01:00<00:17,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9437, LAS: 0.8959, UEM: 0.5770, LEM: 0.3451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2044, partial_loss/deprel_loss: 0.3830, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5221, loss: 0.7520, batch_reg_loss: 0.1748, reg_loss: 0.1750 ||:  82%|########1 | 91/111 [01:02<00:14,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9440, LAS: 0.8962, UEM: 0.5740, LEM: 0.3409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4221, partial_loss/deprel_loss: 0.4896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6510, loss: 0.7511, batch_reg_loss: 0.1748, reg_loss: 0.1750 ||:  85%|########4 | 94/111 [01:05<00:12,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9435, LAS: 0.8957, UEM: 0.5720, LEM: 0.3396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3220, partial_loss/deprel_loss: 0.4080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5656, loss: 0.7546, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||:  88%|########8 | 98/111 [01:07<00:09,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8723, UAS: 0.9435, LAS: 0.8959, UEM: 0.5687, LEM: 0.3355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9934, partial_loss/deprel_loss: 0.7374, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9634, loss: 0.7537, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||:  92%|#########1| 102/111 [01:10<00:06,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9441, LAS: 0.8966, UEM: 0.5770, LEM: 0.3420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1999, partial_loss/deprel_loss: 0.3860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.7478, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||:  95%|#########4| 105/111 [01:13<00:04,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9441, LAS: 0.8966, UEM: 0.5723, LEM: 0.3380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3267, partial_loss/deprel_loss: 0.3953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5564, loss: 0.7484, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||:  98%|#########8| 109/111 [01:15<00:01,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9445, LAS: 0.8970, UEM: 0.5766, LEM: 0.3406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2103, partial_loss/deprel_loss: 0.3635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5076, loss: 0.7455, batch_reg_loss: 0.1748, reg_loss: 0.1749 ||: 100%|##########| 111/111 [01:16<00:00,  1.44it/s]\n",
      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:22:51,428 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.363  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.210  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.175  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - UEM                      |     0.577  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - LAS                      |     0.897  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - loss                     |     0.746  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - LEM                      |     0.341  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - UAS                      |     0.945  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - EM                       |     0.925  |       N/A\n",
      "2023-04-07 00:22:51,429 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:22:51,434 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:22:55,983 - INFO - combo.training.trainer - Epoch duration: 0:01:24.403512\n",
      "2023-04-07 00:22:55,983 - INFO - combo.training.trainer - Estimated training time remaining: 7:19:06\n",
      "2023-04-07 00:22:55,984 - INFO - allennlp.training.trainer - Epoch 70/399\n",
      "2023-04-07 00:22:55,984 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:22:55,984 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:22:55,993 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9506, LAS: 0.9042, UEM: 0.5290, LEM: 0.2968, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6881, partial_loss/deprel_loss: 0.6097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8001, loss: 0.6847, batch_reg_loss: 0.1748, reg_loss: 0.1748 ||:   3%|2         | 3/111 [00:02<01:22,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9477, LAS: 0.8997, UEM: 0.5508, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2564, partial_loss/deprel_loss: 0.4398, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5779, loss: 0.7136, batch_reg_loss: 0.1748, reg_loss: 0.1748 ||:   6%|6         | 7/111 [00:04<01:14,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8665, UAS: 0.9454, LAS: 0.8973, UEM: 0.5153, LEM: 0.2580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8429, partial_loss/deprel_loss: 0.8392, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0147, loss: 0.7399, batch_reg_loss: 0.1747, reg_loss: 0.1748 ||:  10%|9         | 11/111 [00:07<01:10,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9452, LAS: 0.8978, UEM: 0.5334, LEM: 0.2912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5317, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7221, loss: 0.7331, batch_reg_loss: 0.1747, reg_loss: 0.1748 ||:  13%|#2        | 14/111 [00:09<01:08,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8345, UAS: 0.9460, LAS: 0.8982, UEM: 0.5915, LEM: 0.3525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1596, partial_loss/deprel_loss: 0.8480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0851, loss: 0.7203, batch_reg_loss: 0.1747, reg_loss: 0.1748 ||:  16%|#6        | 18/111 [00:12<01:03,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9457, LAS: 0.8980, UEM: 0.5696, LEM: 0.3340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4944, partial_loss/deprel_loss: 0.6857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8221, loss: 0.7229, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  20%|#9        | 22/111 [00:14<00:58,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9450, LAS: 0.8981, UEM: 0.5822, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1255, partial_loss/deprel_loss: 0.2653, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4120, loss: 0.7276, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  23%|##3       | 26/111 [00:17<00:55,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9464, LAS: 0.8994, UEM: 0.6001, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1067, partial_loss/deprel_loss: 0.3424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4700, loss: 0.7160, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  27%|##7       | 30/111 [00:19<00:52,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9470, LAS: 0.9001, UEM: 0.6030, LEM: 0.3675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7936, partial_loss/deprel_loss: 0.7543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9368, loss: 0.7124, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  30%|##9       | 33/111 [00:21<00:51,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9049, UAS: 0.9472, LAS: 0.9003, UEM: 0.6065, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4683, partial_loss/deprel_loss: 0.5891, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7396, loss: 0.7110, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  32%|###2      | 36/111 [00:24<00:52,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9483, LAS: 0.9017, UEM: 0.6156, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1905, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.7037, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  35%|###5      | 39/111 [00:26<00:50,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9464, LAS: 0.8989, UEM: 0.5964, LEM: 0.3577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5875, partial_loss/deprel_loss: 0.6289, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7953, loss: 0.7232, batch_reg_loss: 0.1747, reg_loss: 0.1747 ||:  39%|###8      | 43/111 [00:28<00:46,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8798, UAS: 0.9463, LAS: 0.8987, UEM: 0.5899, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8414, partial_loss/deprel_loss: 0.6776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8850, loss: 0.7244, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  41%|####1     | 46/111 [00:31<00:46,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9472, LAS: 0.8996, UEM: 0.5881, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3002, partial_loss/deprel_loss: 0.4886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6255, loss: 0.7186, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  45%|####5     | 50/111 [00:33<00:41,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9467, LAS: 0.8991, UEM: 0.5861, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2186, partial_loss/deprel_loss: 0.3734, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5171, loss: 0.7234, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  49%|####8     | 54/111 [00:36<00:39,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9450, LAS: 0.8975, UEM: 0.5755, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5630, partial_loss/deprel_loss: 0.6081, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7737, loss: 0.7364, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  51%|#####1    | 57/111 [00:38<00:37,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9450, LAS: 0.8976, UEM: 0.5710, LEM: 0.3301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2503, partial_loss/deprel_loss: 0.3736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.7372, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  55%|#####4    | 61/111 [00:41<00:34,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9442, LAS: 0.8967, UEM: 0.5627, LEM: 0.3232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9444, partial_loss/deprel_loss: 0.8030, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0059, loss: 0.7428, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  59%|#####8    | 65/111 [00:43<00:30,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9451, LAS: 0.8978, UEM: 0.5759, LEM: 0.3349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3515, partial_loss/deprel_loss: 0.4999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6448, loss: 0.7330, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  62%|######2   | 69/111 [00:46<00:28,  1.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9447, LAS: 0.8976, UEM: 0.5749, LEM: 0.3324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3702, partial_loss/deprel_loss: 0.4574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6146, loss: 0.7347, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  66%|######5   | 73/111 [00:49<00:26,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8852, UAS: 0.9453, LAS: 0.8984, UEM: 0.5932, LEM: 0.3584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6705, partial_loss/deprel_loss: 0.6253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8089, loss: 0.7296, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  68%|######8   | 76/111 [00:52<00:26,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9058, UAS: 0.9456, LAS: 0.8986, UEM: 0.5912, LEM: 0.3558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3765, partial_loss/deprel_loss: 0.5242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6692, loss: 0.7272, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  71%|#######1  | 79/111 [00:54<00:23,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9456, LAS: 0.8988, UEM: 0.5885, LEM: 0.3543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3512, partial_loss/deprel_loss: 0.3822, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5506, loss: 0.7257, batch_reg_loss: 0.1746, reg_loss: 0.1747 ||:  74%|#######3  | 82/111 [00:56<00:21,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9458, LAS: 0.8988, UEM: 0.5861, LEM: 0.3519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4328, partial_loss/deprel_loss: 0.5251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6812, loss: 0.7256, batch_reg_loss: 0.1745, reg_loss: 0.1747 ||:  77%|#######6  | 85/111 [00:58<00:18,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9459, LAS: 0.8990, UEM: 0.5836, LEM: 0.3492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6683, partial_loss/deprel_loss: 0.6249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8081, loss: 0.7242, batch_reg_loss: 0.1745, reg_loss: 0.1747 ||:  79%|#######9  | 88/111 [01:00<00:16,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9462, LAS: 0.8994, UEM: 0.5841, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3782, partial_loss/deprel_loss: 0.5520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6918, loss: 0.7221, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||:  83%|########2 | 92/111 [01:03<00:13,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9457, LAS: 0.8989, UEM: 0.5914, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1358, partial_loss/deprel_loss: 0.2361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3906, loss: 0.7262, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||:  86%|########5 | 95/111 [01:05<00:11,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9459, LAS: 0.8990, UEM: 0.5926, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2622, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5503, loss: 0.7256, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||:  89%|########9 | 99/111 [01:08<00:08,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9452, LAS: 0.8983, UEM: 0.5850, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6349, partial_loss/deprel_loss: 0.5700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 0.7305, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||:  93%|#########2| 103/111 [01:10<00:05,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8712, UAS: 0.9447, LAS: 0.8977, UEM: 0.5808, LEM: 0.3479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8001, partial_loss/deprel_loss: 0.7797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9583, loss: 0.7356, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||:  96%|#########6| 107/111 [01:12<00:02,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9445, LAS: 0.8976, UEM: 0.5775, LEM: 0.3453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5486, partial_loss/deprel_loss: 0.6677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8184, loss: 0.7377, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||: 100%|##########| 111/111 [01:15<00:00,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9445, LAS: 0.8976, UEM: 0.5775, LEM: 0.3453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5486, partial_loss/deprel_loss: 0.6677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8184, loss: 0.7377, batch_reg_loss: 0.1745, reg_loss: 0.1746 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-07 00:24:14,896 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9108, UAS: 0.9488, LAS: 0.8951, UEM: 0.5461, LEM: 0.2057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4334, partial_loss/deprel_loss: 24.7874, partial_loss/cycle_loss: 0.0000, batch_loss: 19.9166, loss: 23.9872, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.18it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9478, LAS: 0.8936, UEM: 0.5263, LEM: 0.1940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5667, partial_loss/deprel_loss: 24.3909, partial_loss/cycle_loss: 0.0000, batch_loss: 19.6260, loss: 25.3352, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:07,  1.10it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8277, UAS: 0.9436, LAS: 0.8916, UEM: 0.6500, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5601, partial_loss/deprel_loss: 57.8863, partial_loss/cycle_loss: 0.0000, batch_loss: 46.6211, loss: 27.1227, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:06<00:05,  1.05it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9474, LAS: 0.8963, UEM: 0.6602, LEM: 0.3935, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3731, partial_loss/deprel_loss: 17.6734, partial_loss/cycle_loss: 0.0000, batch_loss: 14.2133, loss: 25.4952, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:09<00:02,  1.04it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9467, LAS: 0.8959, UEM: 0.6521, LEM: 0.3874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9122, partial_loss/deprel_loss: 31.0175, partial_loss/cycle_loss: 0.0000, batch_loss: 24.9964, loss: 26.0198, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9467, LAS: 0.8959, UEM: 0.6521, LEM: 0.3874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9122, partial_loss/deprel_loss: 31.0175, partial_loss/cycle_loss: 0.0000, batch_loss: 24.9964, loss: 26.0198, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 00:24:27,552 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.668  |    31.017\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.549  |     0.912\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.175  |     0.000\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - UEM                      |     0.577  |     0.652\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - LAS                      |     0.898  |     0.896\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - loss                     |     0.738  |    26.020\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - LEM                      |     0.345  |     0.387\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - UAS                      |     0.944  |     0.947\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - EM                       |     0.896  |     0.884\n",
      "2023-04-07 00:24:27,553 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:24:27,558 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:24:32,516 - INFO - combo.training.trainer - Epoch duration: 0:01:36.532109\n",
      "2023-04-07 00:24:32,516 - INFO - combo.training.trainer - Estimated training time remaining: 7:19:04\n",
      "2023-04-07 00:24:32,516 - INFO - allennlp.training.trainer - Epoch 71/399\n",
      "2023-04-07 00:24:32,516 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:24:32,517 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:24:32,524 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9590, LAS: 0.9141, UEM: 0.6957, LEM: 0.4722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1020, partial_loss/deprel_loss: 0.2615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4041, loss: 0.6331, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:   4%|3         | 4/111 [00:02<01:12,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8606, UAS: 0.9402, LAS: 0.8957, UEM: 0.6073, LEM: 0.4034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0627, partial_loss/deprel_loss: 0.6654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9193, loss: 0.7472, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:   6%|6         | 7/111 [00:05<01:15,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9165, UAS: 0.9451, LAS: 0.9012, UEM: 0.5755, LEM: 0.3458, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3404, partial_loss/deprel_loss: 0.4493, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6020, loss: 0.7071, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  10%|9         | 11/111 [00:07<01:10,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9442, LAS: 0.8999, UEM: 0.5837, LEM: 0.3646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6201, partial_loss/deprel_loss: 0.6013, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7796, loss: 0.7150, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  14%|#3        | 15/111 [00:10<01:04,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9411, LAS: 0.8963, UEM: 0.5649, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4521, partial_loss/deprel_loss: 0.5205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6813, loss: 0.7479, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  16%|#6        | 18/111 [00:12<01:03,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9401, LAS: 0.8946, UEM: 0.5597, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2594, partial_loss/deprel_loss: 0.4458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5830, loss: 0.7609, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  20%|#9        | 22/111 [00:15<01:01,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9231, UAS: 0.9421, LAS: 0.8969, UEM: 0.5898, LEM: 0.3564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2663, partial_loss/deprel_loss: 0.4187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5626, loss: 0.7449, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  23%|##2       | 25/111 [00:17<01:00,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8760, UAS: 0.9435, LAS: 0.8984, UEM: 0.5941, LEM: 0.3574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9035, partial_loss/deprel_loss: 0.7504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9555, loss: 0.7326, batch_reg_loss: 0.1745, reg_loss: 0.1745 ||:  26%|##6       | 29/111 [00:19<00:56,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9435, LAS: 0.8980, UEM: 0.5835, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2197, partial_loss/deprel_loss: 0.3918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5318, loss: 0.7323, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  30%|##9       | 33/111 [00:22<00:51,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8720, UAS: 0.9419, LAS: 0.8962, UEM: 0.5642, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8650, partial_loss/deprel_loss: 0.7420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9410, loss: 0.7496, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  32%|###2      | 36/111 [00:24<00:50,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9417, LAS: 0.8960, UEM: 0.5526, LEM: 0.3200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4917, partial_loss/deprel_loss: 0.5471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7104, loss: 0.7502, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  35%|###5      | 39/111 [00:26<00:49,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9422, LAS: 0.8962, UEM: 0.5459, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3982, partial_loss/deprel_loss: 0.4688, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6291, loss: 0.7475, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  39%|###8      | 43/111 [00:28<00:45,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9426, LAS: 0.8967, UEM: 0.5581, LEM: 0.3228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2111, partial_loss/deprel_loss: 0.3592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5040, loss: 0.7444, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  42%|####2     | 47/111 [00:32<00:45,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9429, LAS: 0.8970, UEM: 0.5574, LEM: 0.3219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6908, partial_loss/deprel_loss: 0.6305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8170, loss: 0.7423, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  45%|####5     | 50/111 [00:34<00:44,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9442, LAS: 0.8986, UEM: 0.5893, LEM: 0.3646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2660, partial_loss/deprel_loss: 0.4181, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5620, loss: 0.7319, batch_reg_loss: 0.1744, reg_loss: 0.1745 ||:  48%|####7     | 53/111 [00:37<00:44,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8396, UAS: 0.9442, LAS: 0.8985, UEM: 0.5971, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2169, partial_loss/deprel_loss: 0.9480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1761, loss: 0.7328, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  51%|#####1    | 57/111 [00:39<00:39,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9446, LAS: 0.8990, UEM: 0.5982, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2724, partial_loss/deprel_loss: 0.3848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5367, loss: 0.7271, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  54%|#####4    | 60/111 [00:41<00:36,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9439, LAS: 0.8982, UEM: 0.5894, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8146, partial_loss/deprel_loss: 0.7395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9289, loss: 0.7332, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  58%|#####7    | 64/111 [00:44<00:32,  1.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9441, LAS: 0.8983, UEM: 0.5906, LEM: 0.3623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2832, partial_loss/deprel_loss: 0.4338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5781, loss: 0.7327, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  60%|######    | 67/111 [00:46<00:30,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9442, LAS: 0.8982, UEM: 0.5844, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, partial_loss/deprel_loss: 0.5362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6735, loss: 0.7346, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  64%|######3   | 71/111 [00:48<00:26,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9443, LAS: 0.8983, UEM: 0.5809, LEM: 0.3504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4050, partial_loss/deprel_loss: 0.4906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6479, loss: 0.7343, batch_reg_loss: 0.1744, reg_loss: 0.1744 ||:  68%|######7   | 75/111 [00:51<00:23,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9447, LAS: 0.8986, UEM: 0.5798, LEM: 0.3479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2284, partial_loss/deprel_loss: 0.3343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4875, loss: 0.7322, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9449, LAS: 0.8989, UEM: 0.5804, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3447, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4958, loss: 0.7293, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9453, LAS: 0.8992, UEM: 0.5786, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2871, partial_loss/deprel_loss: 0.4169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5653, loss: 0.7271, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  77%|#######7  | 86/111 [00:59<00:17,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8387, UAS: 0.9448, LAS: 0.8986, UEM: 0.5749, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3576, partial_loss/deprel_loss: 0.9162, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1788, loss: 0.7315, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  80%|########  | 89/111 [01:01<00:15,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9453, LAS: 0.8991, UEM: 0.5820, LEM: 0.3470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2507, partial_loss/deprel_loss: 0.3985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5433, loss: 0.7274, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  84%|########3 | 93/111 [01:04<00:12,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9457, LAS: 0.8996, UEM: 0.5859, LEM: 0.3502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2463, partial_loss/deprel_loss: 0.3536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.7239, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  86%|########6 | 96/111 [01:06<00:10,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9452, LAS: 0.8989, UEM: 0.5788, LEM: 0.3453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8455, partial_loss/deprel_loss: 0.7369, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9329, loss: 0.7287, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  89%|########9 | 99/111 [01:08<00:08,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9451, LAS: 0.8987, UEM: 0.5735, LEM: 0.3395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4627, partial_loss/deprel_loss: 0.5341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6941, loss: 0.7290, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  93%|#########2| 103/111 [01:10<00:05,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9452, LAS: 0.8988, UEM: 0.5804, LEM: 0.3492, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5536, partial_loss/deprel_loss: 0.6417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7984, loss: 0.7292, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  95%|#########5| 106/111 [01:13<00:03,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9449, LAS: 0.8985, UEM: 0.5797, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2004, partial_loss/deprel_loss: 0.3910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5271, loss: 0.7315, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||:  98%|#########8| 109/111 [01:15<00:01,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9453, LAS: 0.8989, UEM: 0.5821, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2464, partial_loss/deprel_loss: 0.4372, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5733, loss: 0.7289, batch_reg_loss: 0.1743, reg_loss: 0.1744 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
      "2023-04-07 00:25:51,826 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.437  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.246  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.174  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - UEM                      |     0.582  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - LAS                      |     0.899  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - loss                     |     0.729  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:25:51,827 - INFO - combo.training.tensorboard_writer - LEM                      |     0.350  |       N/A\n",
      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - UAS                      |     0.945  |       N/A\n",
      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - EM                       |     0.919  |       N/A\n",
      "2023-04-07 00:25:51,828 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:25:51,833 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:25:58,450 - INFO - combo.training.trainer - Epoch duration: 0:01:25.934082\n",
      "2023-04-07 00:25:58,451 - INFO - combo.training.trainer - Estimated training time remaining: 7:18:10\n",
      "2023-04-07 00:25:58,451 - INFO - allennlp.training.trainer - Epoch 72/399\n",
      "2023-04-07 00:25:58,451 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:25:58,451 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:25:58,459 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8653, UAS: 0.9210, LAS: 0.8741, UEM: 0.1528, LEM: 0.0349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0325, partial_loss/deprel_loss: 0.7074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9467, loss: 0.9111, batch_reg_loss: 0.1743, reg_loss: 0.1743 ||:   3%|2         | 3/111 [00:02<01:14,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9339, LAS: 0.8884, UEM: 0.3328, LEM: 0.1396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3098, partial_loss/deprel_loss: 0.4203, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5725, loss: 0.8094, batch_reg_loss: 0.1743, reg_loss: 0.1743 ||:   5%|5         | 6/111 [00:04<01:12,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9389, LAS: 0.8942, UEM: 0.3980, LEM: 0.1852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2779, partial_loss/deprel_loss: 0.4066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5551, loss: 0.7716, batch_reg_loss: 0.1742, reg_loss: 0.1743 ||:   8%|8         | 9/111 [00:06<01:12,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9455, LAS: 0.9005, UEM: 0.5356, LEM: 0.2947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2017, partial_loss/deprel_loss: 0.3285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4774, loss: 0.7129, batch_reg_loss: 0.1742, reg_loss: 0.1743 ||:  11%|#         | 12/111 [00:08<01:10,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9476, LAS: 0.9035, UEM: 0.6410, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0145, partial_loss/deprel_loss: 0.7799, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0010, loss: 0.6982, batch_reg_loss: 0.1742, reg_loss: 0.1743 ||:  14%|#3        | 15/111 [00:11<01:14,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9487, LAS: 0.9049, UEM: 0.6574, LEM: 0.4550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1425, partial_loss/deprel_loss: 0.2706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4192, loss: 0.6935, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  16%|#6        | 18/111 [00:13<01:09,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8470, UAS: 0.9461, LAS: 0.9020, UEM: 0.6318, LEM: 0.4214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3470, partial_loss/deprel_loss: 0.7804, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0679, loss: 0.7139, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  20%|#9        | 22/111 [00:16<01:04,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9479, LAS: 0.9035, UEM: 0.6285, LEM: 0.4075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5938, partial_loss/deprel_loss: 0.5446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7286, loss: 0.6959, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  23%|##3       | 26/111 [00:18<00:59,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9480, LAS: 0.9035, UEM: 0.6255, LEM: 0.4011, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2719, partial_loss/deprel_loss: 0.4565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5938, loss: 0.6938, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  26%|##6       | 29/111 [00:21<00:59,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9482, LAS: 0.9034, UEM: 0.6138, LEM: 0.3845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5769, partial_loss/deprel_loss: 0.6008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7702, loss: 0.6935, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  30%|##9       | 33/111 [00:23<00:55,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9489, LAS: 0.9044, UEM: 0.6279, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6194, partial_loss/deprel_loss: 0.5291, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7213, loss: 0.6839, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  32%|###2      | 36/111 [00:26<00:55,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9488, LAS: 0.9043, UEM: 0.6230, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4926, loss: 0.6844, batch_reg_loss: 0.1742, reg_loss: 0.1742 ||:  36%|###6      | 40/111 [00:29<00:52,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8891, UAS: 0.9484, LAS: 0.9035, UEM: 0.6086, LEM: 0.3789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5742, partial_loss/deprel_loss: 0.5775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7509, loss: 0.6907, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  40%|###9      | 44/111 [00:31<00:46,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9182, UAS: 0.9482, LAS: 0.9033, UEM: 0.5955, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, partial_loss/deprel_loss: 0.4102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5725, loss: 0.6924, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  43%|####3     | 48/111 [00:33<00:41,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8468, UAS: 0.9474, LAS: 0.9021, UEM: 0.5940, LEM: 0.3668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2345, partial_loss/deprel_loss: 0.8553, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1053, loss: 0.7012, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  47%|####6     | 52/111 [00:36<00:38,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9483, LAS: 0.9031, UEM: 0.6069, LEM: 0.3767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2363, partial_loss/deprel_loss: 0.3497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5011, loss: 0.6941, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  50%|#####     | 56/111 [00:39<00:36,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9199, UAS: 0.9483, LAS: 0.9028, UEM: 0.5992, LEM: 0.3684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2925, partial_loss/deprel_loss: 0.3917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5459, loss: 0.6959, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  54%|#####4    | 60/111 [00:41<00:33,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8667, UAS: 0.9464, LAS: 0.9008, UEM: 0.5965, LEM: 0.3693, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0754, partial_loss/deprel_loss: 0.7823, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0150, loss: 0.7112, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  58%|#####7    | 64/111 [00:44<00:31,  1.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8076, UAS: 0.9458, LAS: 0.9003, UEM: 0.6044, LEM: 0.3765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8518, partial_loss/deprel_loss: 1.1044, partial_loss/cycle_loss: 0.0000, batch_loss: 1.4279, loss: 0.7156, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  61%|######1   | 68/111 [00:47<00:29,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9458, LAS: 0.9002, UEM: 0.6026, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6688, partial_loss/deprel_loss: 0.6208, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8045, loss: 0.7183, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  64%|######3   | 71/111 [00:49<00:29,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9061, UAS: 0.9461, LAS: 0.9006, UEM: 0.6006, LEM: 0.3704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3879, partial_loss/deprel_loss: 0.5238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6707, loss: 0.7152, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  67%|######6   | 74/111 [00:52<00:26,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9453, LAS: 0.8996, UEM: 0.5901, LEM: 0.3609, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5763, partial_loss/deprel_loss: 0.6045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7729, loss: 0.7218, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  70%|#######   | 78/111 [00:54<00:22,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9454, LAS: 0.8994, UEM: 0.5849, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7327, partial_loss/deprel_loss: 0.6924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8746, loss: 0.7226, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  74%|#######3  | 82/111 [00:56<00:19,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9455, LAS: 0.8995, UEM: 0.5842, LEM: 0.3510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7146, partial_loss/deprel_loss: 0.6244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8165, loss: 0.7207, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  77%|#######7  | 86/111 [00:59<00:16,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8576, UAS: 0.9446, LAS: 0.8984, UEM: 0.5772, LEM: 0.3451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0883, partial_loss/deprel_loss: 0.7811, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0166, loss: 0.7292, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  81%|########1 | 90/111 [01:02<00:13,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9444, LAS: 0.8984, UEM: 0.5738, LEM: 0.3422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8949, partial_loss/deprel_loss: 0.6739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8922, loss: 0.7309, batch_reg_loss: 0.1741, reg_loss: 0.1742 ||:  85%|########4 | 94/111 [01:04<00:11,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9445, LAS: 0.8985, UEM: 0.5741, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7387, partial_loss/deprel_loss: 0.6574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8477, loss: 0.7307, batch_reg_loss: 0.1741, reg_loss: 0.1741 ||:  88%|########8 | 98/111 [01:07<00:08,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9456, LAS: 0.8997, UEM: 0.5927, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0877, partial_loss/deprel_loss: 0.2313, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3766, loss: 0.7215, batch_reg_loss: 0.1741, reg_loss: 0.1741 ||:  92%|#########1| 102/111 [01:10<00:06,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9453, LAS: 0.8995, UEM: 0.5870, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6028, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7565, loss: 0.7237, batch_reg_loss: 0.1741, reg_loss: 0.1741 ||:  95%|#########4| 105/111 [01:12<00:04,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9456, LAS: 0.8997, UEM: 0.5861, LEM: 0.3529, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4799, partial_loss/deprel_loss: 0.5671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7237, loss: 0.7223, batch_reg_loss: 0.1741, reg_loss: 0.1741 ||:  97%|#########7| 108/111 [01:14<00:02,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9457, LAS: 0.8998, UEM: 0.5843, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.4537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5946, loss: 0.7223, batch_reg_loss: 0.1740, reg_loss: 0.1741 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9457, LAS: 0.8998, UEM: 0.5843, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.4537, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5946, loss: 0.7223, batch_reg_loss: 0.1740, reg_loss: 0.1741 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-07 00:27:18,544 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.454  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.288  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.174  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - UEM                      |     0.584  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - LAS                      |     0.900  |       N/A\n",
      "2023-04-07 00:27:18,545 - INFO - combo.training.tensorboard_writer - loss                     |     0.722  |       N/A\n",
      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - LEM                      |     0.351  |       N/A\n",
      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - UAS                      |     0.946  |       N/A\n",
      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - EM                       |     0.924  |       N/A\n",
      "2023-04-07 00:27:18,546 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:27:18,552 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:27:24,771 - INFO - combo.training.trainer - Epoch duration: 0:01:26.320285\n",
      "2023-04-07 00:27:24,771 - INFO - combo.training.trainer - Estimated training time remaining: 7:17:18\n",
      "2023-04-07 00:27:24,771 - INFO - allennlp.training.trainer - Epoch 73/399\n",
      "2023-04-07 00:27:24,772 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:27:24,772 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:27:24,779 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9532, LAS: 0.9077, UEM: 0.5342, LEM: 0.2404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2385, partial_loss/deprel_loss: 0.4693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5971, loss: 0.6751, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:   4%|3         | 4/111 [00:02<01:12,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9652, UAS: 0.9604, LAS: 0.9180, UEM: 0.7379, LEM: 0.5320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0522, partial_loss/deprel_loss: 0.1375, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2945, loss: 0.5981, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:   6%|6         | 7/111 [00:05<01:14,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9585, LAS: 0.9155, UEM: 0.6843, LEM: 0.4623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3479, partial_loss/deprel_loss: 0.5002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6437, loss: 0.6111, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:  10%|9         | 11/111 [00:07<01:10,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9587, LAS: 0.9153, UEM: 0.6754, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6654, partial_loss/deprel_loss: 0.5753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7673, loss: 0.6098, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:  13%|#2        | 14/111 [00:10<01:09,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9597, LAS: 0.9163, UEM: 0.6823, LEM: 0.4418, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2609, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5908, loss: 0.6001, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:  15%|#5        | 17/111 [00:12<01:09,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8714, UAS: 0.9560, LAS: 0.9106, UEM: 0.6453, LEM: 0.4084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8720, partial_loss/deprel_loss: 0.6651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8805, loss: 0.6418, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:  19%|#8        | 21/111 [00:15<01:04,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8644, UAS: 0.9553, LAS: 0.9103, UEM: 0.6530, LEM: 0.4157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0246, partial_loss/deprel_loss: 0.8085, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0257, loss: 0.6453, batch_reg_loss: 0.1740, reg_loss: 0.1740 ||:  22%|##1       | 24/111 [00:17<01:02,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9540, LAS: 0.9098, UEM: 0.6519, LEM: 0.4187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3734, partial_loss/deprel_loss: 0.4383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5992, loss: 0.6471, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  24%|##4       | 27/111 [00:19<01:00,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8607, UAS: 0.9525, LAS: 0.9076, UEM: 0.6388, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9665, partial_loss/deprel_loss: 0.7185, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9421, loss: 0.6611, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  28%|##7       | 31/111 [00:21<00:55,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8631, UAS: 0.9514, LAS: 0.9063, UEM: 0.6255, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0289, partial_loss/deprel_loss: 0.7669, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9932, loss: 0.6731, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  31%|###       | 34/111 [00:24<00:52,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9517, LAS: 0.9066, UEM: 0.6244, LEM: 0.3906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1890, partial_loss/deprel_loss: 0.3509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4924, loss: 0.6727, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  33%|###3      | 37/111 [00:26<00:51,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9514, LAS: 0.9063, UEM: 0.6176, LEM: 0.3814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5196, partial_loss/deprel_loss: 0.5613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7269, loss: 0.6731, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  36%|###6      | 40/111 [00:28<00:49,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8627, UAS: 0.9502, LAS: 0.9048, UEM: 0.6083, LEM: 0.3723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0434, partial_loss/deprel_loss: 0.8135, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0334, loss: 0.6860, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  40%|###9      | 44/111 [00:30<00:45,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9485, LAS: 0.9032, UEM: 0.5897, LEM: 0.3579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9389, partial_loss/deprel_loss: 0.7671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9754, loss: 0.7012, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  43%|####3     | 48/111 [00:33<00:41,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9485, LAS: 0.9034, UEM: 0.5817, LEM: 0.3499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7179, partial_loss/deprel_loss: 0.6370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8271, loss: 0.7025, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  47%|####6     | 52/111 [00:35<00:37,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9486, LAS: 0.9035, UEM: 0.5822, LEM: 0.3508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3235, partial_loss/deprel_loss: 0.4352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5868, loss: 0.7005, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  50%|#####     | 56/111 [00:38<00:37,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9498, LAS: 0.9046, UEM: 0.6007, LEM: 0.3648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2713, partial_loss/deprel_loss: 0.4238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5672, loss: 0.6910, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  53%|#####3    | 59/111 [00:40<00:36,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9496, LAS: 0.9047, UEM: 0.6015, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4178, partial_loss/deprel_loss: 0.4418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6108, loss: 0.6893, batch_reg_loss: 0.1739, reg_loss: 0.1740 ||:  56%|#####5    | 62/111 [00:43<00:34,  1.42it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9491, LAS: 0.9041, UEM: 0.5914, LEM: 0.3569, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4079, partial_loss/deprel_loss: 0.4585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6222, loss: 0.6939, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:  59%|#####9    | 66/111 [00:45<00:30,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9480, LAS: 0.9030, UEM: 0.5828, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3412, partial_loss/deprel_loss: 0.4105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5705, loss: 0.7012, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:  63%|######3   | 70/111 [00:48<00:27,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8167, UAS: 0.9473, LAS: 0.9025, UEM: 0.5904, LEM: 0.3606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.8044, partial_loss/deprel_loss: 1.0041, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3380, loss: 0.7049, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:  67%|######6   | 74/111 [00:51<00:26,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9003, UAS: 0.9475, LAS: 0.9027, UEM: 0.5984, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5672, partial_loss/deprel_loss: 0.6062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7722, loss: 0.7044, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:  69%|######9   | 77/111 [00:53<00:23,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9465, LAS: 0.9015, UEM: 0.5902, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6163, partial_loss/deprel_loss: 0.5954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7734, loss: 0.7126, batch_reg_loss: 0.1739, reg_loss: 0.1739 ||:  72%|#######2  | 80/111 [00:55<00:22,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8700, UAS: 0.9460, LAS: 0.9007, UEM: 0.5845, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9029, partial_loss/deprel_loss: 0.7944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9899, loss: 0.7188, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  76%|#######5  | 84/111 [00:58<00:18,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8562, UAS: 0.9461, LAS: 0.9008, UEM: 0.5894, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0194, partial_loss/deprel_loss: 0.7513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9788, loss: 0.7168, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  79%|#######9  | 88/111 [01:00<00:15,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9464, LAS: 0.9011, UEM: 0.5857, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3949, partial_loss/deprel_loss: 0.4863, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6419, loss: 0.7150, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  82%|########1 | 91/111 [01:03<00:14,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8849, UAS: 0.9463, LAS: 0.9008, UEM: 0.5802, LEM: 0.3548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7188, partial_loss/deprel_loss: 0.7382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9082, loss: 0.7179, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  85%|########4 | 94/111 [01:05<00:12,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9464, LAS: 0.9009, UEM: 0.5844, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3451, partial_loss/deprel_loss: 0.4686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6178, loss: 0.7152, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  87%|########7 | 97/111 [01:07<00:10,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9463, LAS: 0.9008, UEM: 0.5848, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3774, partial_loss/deprel_loss: 0.5079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6556, loss: 0.7175, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  90%|######### | 100/111 [01:09<00:08,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9466, LAS: 0.9012, UEM: 0.5866, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2466, partial_loss/deprel_loss: 0.4409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5759, loss: 0.7140, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  94%|#########3| 104/111 [01:12<00:05,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8519, UAS: 0.9466, LAS: 0.9010, UEM: 0.5883, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2192, partial_loss/deprel_loss: 0.8357, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0862, loss: 0.7151, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||:  96%|#########6| 107/111 [01:14<00:02,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9465, LAS: 0.9009, UEM: 0.5843, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5333, partial_loss/deprel_loss: 0.6096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7682, loss: 0.7148, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 100%|##########| 111/111 [01:17<00:00,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9465, LAS: 0.9009, UEM: 0.5843, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5333, partial_loss/deprel_loss: 0.6096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7682, loss: 0.7148, batch_reg_loss: 0.1738, reg_loss: 0.1739 ||: 100%|##########| 111/111 [01:17<00:00,  1.44it/s]\n",
      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:28:45,374 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.610  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.533  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.174  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - UEM                      |     0.584  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - LAS                      |     0.901  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - loss                     |     0.715  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - LEM                      |     0.354  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - UAS                      |     0.947  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - EM                       |     0.894  |       N/A\n",
      "2023-04-07 00:28:45,375 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:28:45,380 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:28:50,593 - INFO - combo.training.trainer - Epoch duration: 0:01:25.821825\n",
      "2023-04-07 00:28:50,594 - INFO - combo.training.trainer - Estimated training time remaining: 7:16:22\n",
      "2023-04-07 00:28:50,594 - INFO - allennlp.training.trainer - Epoch 74/399\n",
      "2023-04-07 00:28:50,594 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:28:50,595 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:28:50,602 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8910, UAS: 0.9457, LAS: 0.8979, UEM: 0.4358, LEM: 0.1813, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4698, partial_loss/deprel_loss: 0.6442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7831, loss: 0.7372, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:   4%|3         | 4/111 [00:02<01:04,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9483, LAS: 0.8997, UEM: 0.4974, LEM: 0.2300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4275, partial_loss/deprel_loss: 0.6147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7511, loss: 0.7173, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:   6%|6         | 7/111 [00:04<01:06,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9457, LAS: 0.8984, UEM: 0.4551, LEM: 0.2003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5032, partial_loss/deprel_loss: 0.5335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7012, loss: 0.7334, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:  10%|9         | 11/111 [00:07<01:03,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9439, LAS: 0.8984, UEM: 0.4737, LEM: 0.2324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5044, loss: 0.7341, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:  13%|#2        | 14/111 [00:09<01:03,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9475, LAS: 0.9026, UEM: 0.5509, LEM: 0.3213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4653, partial_loss/deprel_loss: 0.5485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7056, loss: 0.7058, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:  16%|#6        | 18/111 [00:11<01:01,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9479, LAS: 0.9031, UEM: 0.5658, LEM: 0.3382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1822, partial_loss/deprel_loss: 0.3363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4793, loss: 0.6988, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:  20%|#9        | 22/111 [00:14<01:00,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9479, LAS: 0.9028, UEM: 0.5521, LEM: 0.3233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3213, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5888, loss: 0.7014, batch_reg_loss: 0.1738, reg_loss: 0.1738 ||:  23%|##2       | 25/111 [00:17<01:00,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9110, UAS: 0.9484, LAS: 0.9031, UEM: 0.5483, LEM: 0.3160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3309, partial_loss/deprel_loss: 0.5004, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.6986, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  25%|##5       | 28/111 [00:19<01:00,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8777, UAS: 0.9473, LAS: 0.9015, UEM: 0.5368, LEM: 0.3037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6838, partial_loss/deprel_loss: 0.6598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8384, loss: 0.7088, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  29%|##8       | 32/111 [00:21<00:54,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9485, LAS: 0.9027, UEM: 0.5627, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3361, partial_loss/deprel_loss: 0.4837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6279, loss: 0.7007, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  32%|###1      | 35/111 [00:24<00:53,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9201, UAS: 0.9499, LAS: 0.9039, UEM: 0.5790, LEM: 0.3363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.4233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5580, loss: 0.6914, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  34%|###4      | 38/111 [00:26<00:53,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8834, UAS: 0.9492, LAS: 0.9031, UEM: 0.5832, LEM: 0.3421, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5601, partial_loss/deprel_loss: 0.7277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8679, loss: 0.6963, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  37%|###6      | 41/111 [00:28<00:50,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8833, UAS: 0.9482, LAS: 0.9020, UEM: 0.5690, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8162, partial_loss/deprel_loss: 0.7002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8971, loss: 0.7059, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  40%|###9      | 44/111 [00:30<00:48,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9478, LAS: 0.9018, UEM: 0.5640, LEM: 0.3279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2325, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5083, loss: 0.7076, batch_reg_loss: 0.1737, reg_loss: 0.1738 ||:  43%|####3     | 48/111 [00:33<00:42,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9472, LAS: 0.9016, UEM: 0.5642, LEM: 0.3289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2649, partial_loss/deprel_loss: 0.3708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5233, loss: 0.7090, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  47%|####6     | 52/111 [00:35<00:40,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9473, LAS: 0.9019, UEM: 0.5663, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2980, partial_loss/deprel_loss: 0.4821, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6190, loss: 0.7079, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  50%|####9     | 55/111 [00:37<00:38,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9480, LAS: 0.9025, UEM: 0.5654, LEM: 0.3257, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2673, partial_loss/deprel_loss: 0.4732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6057, loss: 0.7046, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  52%|#####2    | 58/111 [00:40<00:37,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9475, LAS: 0.9022, UEM: 0.5687, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5214, loss: 0.7055, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  56%|#####5    | 62/111 [00:42<00:34,  1.43it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9476, LAS: 0.9025, UEM: 0.6012, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1395, partial_loss/deprel_loss: 0.3569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4871, loss: 0.7037, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  59%|#####8    | 65/111 [00:45<00:33,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8939, UAS: 0.9469, LAS: 0.9016, UEM: 0.5897, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5729, partial_loss/deprel_loss: 0.5866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7575, loss: 0.7124, batch_reg_loss: 0.1737, reg_loss: 0.1737 ||:  62%|######2   | 69/111 [00:47<00:29,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8403, UAS: 0.9468, LAS: 0.9016, UEM: 0.5911, LEM: 0.3602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4491, partial_loss/deprel_loss: 0.8480, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1418, loss: 0.7127, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  66%|######5   | 73/111 [00:50<00:26,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9465, LAS: 0.9013, UEM: 0.5840, LEM: 0.3541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7986, partial_loss/deprel_loss: 0.7437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9283, loss: 0.7160, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  68%|######8   | 76/111 [00:52<00:24,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9460, LAS: 0.9008, UEM: 0.5814, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2858, partial_loss/deprel_loss: 0.4362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.7194, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  72%|#######2  | 80/111 [00:55<00:20,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9465, LAS: 0.9011, UEM: 0.5803, LEM: 0.3452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4513, partial_loss/deprel_loss: 0.5489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7031, loss: 0.7158, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  76%|#######5  | 84/111 [00:57<00:18,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8191, UAS: 0.9453, LAS: 0.8998, UEM: 0.5735, LEM: 0.3399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7406, partial_loss/deprel_loss: 1.0592, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3691, loss: 0.7262, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  78%|#######8  | 87/111 [01:00<00:16,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9462, LAS: 0.9008, UEM: 0.5816, LEM: 0.3452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1876, partial_loss/deprel_loss: 0.3523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4930, loss: 0.7184, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  82%|########1 | 91/111 [01:02<00:13,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8601, UAS: 0.9458, LAS: 0.9004, UEM: 0.5796, LEM: 0.3441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9515, partial_loss/deprel_loss: 0.8350, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0319, loss: 0.7209, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  86%|########5 | 95/111 [01:05<00:10,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9462, LAS: 0.9009, UEM: 0.5865, LEM: 0.3511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2142, partial_loss/deprel_loss: 0.3441, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4918, loss: 0.7158, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  88%|########8 | 98/111 [01:07<00:09,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9463, LAS: 0.9009, UEM: 0.5842, LEM: 0.3484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3423, partial_loss/deprel_loss: 0.5043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6456, loss: 0.7160, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  91%|######### | 101/111 [01:09<00:07,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8651, UAS: 0.9461, LAS: 0.9005, UEM: 0.5788, LEM: 0.3430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9346, partial_loss/deprel_loss: 0.7656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9730, loss: 0.7180, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  95%|#########4| 105/111 [01:12<00:04,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9465, LAS: 0.9009, UEM: 0.5816, LEM: 0.3436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6470, partial_loss/deprel_loss: 0.5651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7551, loss: 0.7137, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||:  98%|#########8| 109/111 [01:15<00:01,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9469, LAS: 0.9013, UEM: 0.5879, LEM: 0.3505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4319, partial_loss/deprel_loss: 0.4654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6323, loss: 0.7106, batch_reg_loss: 0.1736, reg_loss: 0.1737 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.465  |       N/A\n",
      "2023-04-07 00:30:10,471 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.432  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.174  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - UEM                      |     0.588  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - LAS                      |     0.901  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - loss                     |     0.711  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - LEM                      |     0.351  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - UAS                      |     0.947  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - EM                       |     0.912  |       N/A\n",
      "2023-04-07 00:30:10,472 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:30:10,477 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:30:15,615 - INFO - combo.training.trainer - Epoch duration: 0:01:25.020714\n",
      "2023-04-07 00:30:15,615 - INFO - combo.training.trainer - Estimated training time remaining: 7:15:22\n",
      "2023-04-07 00:30:15,616 - INFO - allennlp.training.trainer - Epoch 75/399\n",
      "2023-04-07 00:30:15,616 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:30:15,616 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:30:15,626 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9491, LAS: 0.9042, UEM: 0.4891, LEM: 0.2782, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6299, partial_loss/deprel_loss: 0.6336, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8064, loss: 0.7056, batch_reg_loss: 0.1736, reg_loss: 0.1736 ||:   4%|3         | 4/111 [00:02<01:08,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9499, LAS: 0.9071, UEM: 0.4945, LEM: 0.2844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3865, partial_loss/deprel_loss: 0.4271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.6799, batch_reg_loss: 0.1736, reg_loss: 0.1736 ||:   6%|6         | 7/111 [00:04<01:07,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9516, LAS: 0.9080, UEM: 0.5327, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4005, partial_loss/deprel_loss: 0.5567, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6990, loss: 0.6671, batch_reg_loss: 0.1735, reg_loss: 0.1736 ||:   9%|9         | 10/111 [00:06<01:06,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9507, LAS: 0.9067, UEM: 0.5098, LEM: 0.2815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4433, partial_loss/deprel_loss: 0.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6896, loss: 0.6811, batch_reg_loss: 0.1735, reg_loss: 0.1736 ||:  12%|#1        | 13/111 [00:08<01:05,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9465, LAS: 0.9025, UEM: 0.4974, LEM: 0.2796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9581, partial_loss/deprel_loss: 0.7562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9701, loss: 0.7203, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  15%|#5        | 17/111 [00:11<01:02,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9489, LAS: 0.9046, UEM: 0.5301, LEM: 0.2974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2274, partial_loss/deprel_loss: 0.4505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5794, loss: 0.6991, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  19%|#8        | 21/111 [00:14<01:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9478, LAS: 0.9035, UEM: 0.5397, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5845, partial_loss/deprel_loss: 0.5930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7648, loss: 0.7022, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  22%|##1       | 24/111 [00:16<00:58,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9468, LAS: 0.9015, UEM: 0.5314, LEM: 0.3007, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2592, partial_loss/deprel_loss: 0.4407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5779, loss: 0.7139, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  24%|##4       | 27/111 [00:18<00:58,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9464, LAS: 0.9007, UEM: 0.5205, LEM: 0.2877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8469, partial_loss/deprel_loss: 0.7144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9144, loss: 0.7212, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  28%|##7       | 31/111 [00:20<00:54,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9458, LAS: 0.9003, UEM: 0.5028, LEM: 0.2713, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7110, partial_loss/deprel_loss: 0.5689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7708, loss: 0.7229, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  32%|###1      | 35/111 [00:23<00:49,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9465, LAS: 0.9008, UEM: 0.5095, LEM: 0.2718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2651, partial_loss/deprel_loss: 0.4027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5487, loss: 0.7180, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  35%|###5      | 39/111 [00:25<00:46,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9450, LAS: 0.8992, UEM: 0.5146, LEM: 0.2811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3986, partial_loss/deprel_loss: 0.8601, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1413, loss: 0.7268, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  39%|###8      | 43/111 [00:28<00:46,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9453, LAS: 0.8996, UEM: 0.5111, LEM: 0.2752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7778, partial_loss/deprel_loss: 0.7009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8898, loss: 0.7258, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  42%|####2     | 47/111 [00:31<00:42,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9460, LAS: 0.9001, UEM: 0.5274, LEM: 0.2936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1283, partial_loss/deprel_loss: 0.2925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4332, loss: 0.7209, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  45%|####5     | 50/111 [00:33<00:41,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9331, UAS: 0.9465, LAS: 0.9009, UEM: 0.5576, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1901, partial_loss/deprel_loss: 0.3367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4808, loss: 0.7148, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  48%|####7     | 53/111 [00:35<00:41,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9470, LAS: 0.9016, UEM: 0.5619, LEM: 0.3321, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4573, partial_loss/deprel_loss: 0.5106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6734, loss: 0.7086, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  50%|#####     | 56/111 [00:38<00:40,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9478, LAS: 0.9026, UEM: 0.5709, LEM: 0.3398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2196, partial_loss/deprel_loss: 0.3034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4601, loss: 0.7010, batch_reg_loss: 0.1735, reg_loss: 0.1735 ||:  53%|#####3    | 59/111 [00:40<00:40,  1.29it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9478, LAS: 0.9028, UEM: 0.5694, LEM: 0.3376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3711, partial_loss/deprel_loss: 0.4710, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6245, loss: 0.6999, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  56%|#####5    | 62/111 [00:42<00:36,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8679, UAS: 0.9477, LAS: 0.9025, UEM: 0.5648, LEM: 0.3325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9499, partial_loss/deprel_loss: 0.7206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9399, loss: 0.7035, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  59%|#####8    | 65/111 [00:44<00:33,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8757, UAS: 0.9478, LAS: 0.9026, UEM: 0.5617, LEM: 0.3290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7457, partial_loss/deprel_loss: 0.7231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9010, loss: 0.7022, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  62%|######2   | 69/111 [00:47<00:29,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8668, UAS: 0.9464, LAS: 0.9012, UEM: 0.5578, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0939, partial_loss/deprel_loss: 0.8407, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0648, loss: 0.7157, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  65%|######4   | 72/111 [00:49<00:27,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9469, LAS: 0.9017, UEM: 0.5644, LEM: 0.3297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5945, partial_loss/deprel_loss: 0.5757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7529, loss: 0.7114, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  68%|######7   | 75/111 [00:51<00:25,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8894, UAS: 0.9467, LAS: 0.9014, UEM: 0.5578, LEM: 0.3226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6574, partial_loss/deprel_loss: 0.6179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7992, loss: 0.7137, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  71%|#######1  | 79/111 [00:54<00:21,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9470, LAS: 0.9017, UEM: 0.5695, LEM: 0.3354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5613, partial_loss/deprel_loss: 0.5691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7409, loss: 0.7098, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9227, UAS: 0.9473, LAS: 0.9019, UEM: 0.5681, LEM: 0.3323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3195, partial_loss/deprel_loss: 0.4217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5746, loss: 0.7095, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  78%|#######8  | 87/111 [00:59<00:16,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9471, LAS: 0.9017, UEM: 0.5661, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4214, partial_loss/deprel_loss: 0.4737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6366, loss: 0.7102, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  82%|########1 | 91/111 [01:01<00:12,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8424, UAS: 0.9471, LAS: 0.9017, UEM: 0.5694, LEM: 0.3318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3132, partial_loss/deprel_loss: 0.8401, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1081, loss: 0.7094, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  86%|########5 | 95/111 [01:04<00:10,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9467, LAS: 0.9015, UEM: 0.5678, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4053, partial_loss/deprel_loss: 0.4962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6514, loss: 0.7116, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  89%|########9 | 99/111 [01:07<00:07,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9472, LAS: 0.9019, UEM: 0.5759, LEM: 0.3360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1922, partial_loss/deprel_loss: 0.3905, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5242, loss: 0.7089, batch_reg_loss: 0.1734, reg_loss: 0.1735 ||:  93%|#########2| 103/111 [01:10<00:05,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8366, UAS: 0.9472, LAS: 0.9020, UEM: 0.5894, LEM: 0.3556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3455, partial_loss/deprel_loss: 1.0114, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2516, loss: 0.7093, batch_reg_loss: 0.1733, reg_loss: 0.1735 ||:  95%|#########5| 106/111 [01:12<00:03,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8681, UAS: 0.9473, LAS: 0.9022, UEM: 0.5902, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0149, partial_loss/deprel_loss: 0.6764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9174, loss: 0.7074, batch_reg_loss: 0.1733, reg_loss: 0.1735 ||:  99%|#########9| 110/111 [01:14<00:00,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9474, LAS: 0.9022, UEM: 0.5892, LEM: 0.3539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5141, partial_loss/deprel_loss: 0.4841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6635, loss: 0.7070, batch_reg_loss: 0.1733, reg_loss: 0.1735 ||: 100%|##########| 111/111 [01:15<00:00,  1.47it/s]\n",
      "2023-04-07 00:31:33,915 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8312, UAS: 0.9126, LAS: 0.8528, UEM: 0.2678, LEM: 0.0820, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5891, partial_loss/deprel_loss: 57.0978, partial_loss/cycle_loss: 0.0000, batch_loss: 45.9961, loss: 35.5607, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.04s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9458, LAS: 0.8918, UEM: 0.6731, LEM: 0.3689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4201, partial_loss/deprel_loss: 24.8719, partial_loss/cycle_loss: 0.0000, batch_loss: 19.9815, loss: 26.3380, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:08,  1.01s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8755, UAS: 0.9447, LAS: 0.8922, UEM: 0.6285, LEM: 0.3438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0363, partial_loss/deprel_loss: 36.5851, partial_loss/cycle_loss: 0.0000, batch_loss: 29.4754, loss: 26.2771, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9436, LAS: 0.8913, UEM: 0.6011, LEM: 0.3155, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5407, partial_loss/deprel_loss: 24.4729, partial_loss/cycle_loss: 0.0000, batch_loss: 19.6864, loss: 26.8626, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:09<00:02,  1.02it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9466, LAS: 0.8953, UEM: 0.6564, LEM: 0.3961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1730, partial_loss/deprel_loss: 20.4255, partial_loss/cycle_loss: 0.0000, batch_loss: 16.3750, loss: 25.7702, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.01it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9464, LAS: 0.8949, UEM: 0.6475, LEM: 0.3824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6519, partial_loss/deprel_loss: 34.6901, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8825, loss: 25.9327, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.04it/s]\n",
      "2023-04-07 00:31:46,420 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.484  |    34.690\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.514  |     0.652\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |     0.000\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - UEM                      |     0.589  |     0.648\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - LAS                      |     0.902  |     0.895\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - loss                     |     0.707  |    25.933\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:31:46,421 - INFO - combo.training.tensorboard_writer - LEM                      |     0.354  |     0.382\n",
      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - UAS                      |     0.947  |     0.946\n",
      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - EM                       |     0.907  |     0.890\n",
      "2023-04-07 00:31:46,422 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:31:46,427 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:31:51,593 - INFO - combo.training.trainer - Epoch duration: 0:01:35.977183\n",
      "2023-04-07 00:31:51,595 - INFO - combo.training.trainer - Estimated training time remaining: 7:15:08\n",
      "2023-04-07 00:31:51,595 - INFO - allennlp.training.trainer - Epoch 76/399\n",
      "2023-04-07 00:31:51,595 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:31:51,596 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:31:51,605 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8557, UAS: 0.9347, LAS: 0.8909, UEM: 0.5095, LEM: 0.2695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2675, partial_loss/deprel_loss: 0.8097, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0746, loss: 0.7894, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:   4%|3         | 4/111 [00:02<01:09,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8760, UAS: 0.9366, LAS: 0.8924, UEM: 0.3993, LEM: 0.1864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9186, partial_loss/deprel_loss: 0.7514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9581, loss: 0.7899, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:   7%|7         | 8/111 [00:05<01:05,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8899, UAS: 0.9376, LAS: 0.8935, UEM: 0.3859, LEM: 0.1759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6642, partial_loss/deprel_loss: 0.6574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8321, loss: 0.7815, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  10%|9         | 11/111 [00:07<01:05,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9429, LAS: 0.8999, UEM: 0.5021, LEM: 0.2824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1660, partial_loss/deprel_loss: 0.3516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.7301, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  13%|#2        | 14/111 [00:09<01:07,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9421, LAS: 0.8981, UEM: 0.4642, LEM: 0.2499, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5952, partial_loss/deprel_loss: 0.5753, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7526, loss: 0.7337, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  16%|#6        | 18/111 [00:12<01:03,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8869, UAS: 0.9433, LAS: 0.8993, UEM: 0.4622, LEM: 0.2416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7205, partial_loss/deprel_loss: 0.6275, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8194, loss: 0.7294, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  19%|#8        | 21/111 [00:14<01:01,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8956, UAS: 0.9412, LAS: 0.8971, UEM: 0.4414, LEM: 0.2264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5751, partial_loss/deprel_loss: 0.5682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7429, loss: 0.7399, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  22%|##1       | 24/111 [00:16<00:59,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9438, LAS: 0.9003, UEM: 0.4829, LEM: 0.2618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1826, partial_loss/deprel_loss: 0.2829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4361, loss: 0.7217, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  25%|##5       | 28/111 [00:18<00:53,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9451, LAS: 0.9016, UEM: 0.5168, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6928, partial_loss/deprel_loss: 0.6290, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8150, loss: 0.7092, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  28%|##7       | 31/111 [00:20<00:56,  1.42it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8856, UAS: 0.9432, LAS: 0.8997, UEM: 0.5206, LEM: 0.3000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7606, partial_loss/deprel_loss: 0.6660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8582, loss: 0.7262, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  31%|###       | 34/111 [00:23<00:55,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9443, LAS: 0.9008, UEM: 0.5325, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2798, partial_loss/deprel_loss: 0.3900, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5412, loss: 0.7177, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  33%|###3      | 37/111 [00:25<00:52,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9536, UAS: 0.9462, LAS: 0.9029, UEM: 0.5708, LEM: 0.3511, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0746, partial_loss/deprel_loss: 0.1974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3461, loss: 0.7017, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  36%|###6      | 40/111 [00:27<00:49,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9462, LAS: 0.9027, UEM: 0.5641, LEM: 0.3419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3328, partial_loss/deprel_loss: 0.4941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6351, loss: 0.7032, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  39%|###8      | 43/111 [00:29<00:48,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8922, UAS: 0.9468, LAS: 0.9032, UEM: 0.5601, LEM: 0.3345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5435, partial_loss/deprel_loss: 0.6927, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8361, loss: 0.7015, batch_reg_loss: 0.1733, reg_loss: 0.1733 ||:  42%|####2     | 47/111 [00:32<00:44,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9016, UAS: 0.9467, LAS: 0.9027, UEM: 0.5492, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4341, partial_loss/deprel_loss: 0.5543, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7035, loss: 0.7062, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  45%|####5     | 50/111 [00:34<00:41,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8707, UAS: 0.9462, LAS: 0.9021, UEM: 0.5426, LEM: 0.3180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0915, partial_loss/deprel_loss: 0.7196, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9672, loss: 0.7087, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  49%|####8     | 54/111 [00:36<00:37,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9460, LAS: 0.9020, UEM: 0.5445, LEM: 0.3212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1289, partial_loss/deprel_loss: 0.2808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4237, loss: 0.7099, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  52%|#####2    | 58/111 [00:39<00:34,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8858, UAS: 0.9462, LAS: 0.9021, UEM: 0.5429, LEM: 0.3164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7801, partial_loss/deprel_loss: 0.6634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8600, loss: 0.7097, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  56%|#####5    | 62/111 [00:42<00:33,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9451, LAS: 0.9010, UEM: 0.5357, LEM: 0.3106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4855, partial_loss/deprel_loss: 0.4707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6469, loss: 0.7182, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  59%|#####8    | 65/111 [00:44<00:32,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9461, LAS: 0.9021, UEM: 0.5474, LEM: 0.3176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.3456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4927, loss: 0.7102, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  61%|######1   | 68/111 [00:46<00:30,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9467, LAS: 0.9027, UEM: 0.5512, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1928, partial_loss/deprel_loss: 0.3655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5042, loss: 0.7054, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  65%|######4   | 72/111 [00:49<00:27,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9475, LAS: 0.9035, UEM: 0.5626, LEM: 0.3277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2363, partial_loss/deprel_loss: 0.3691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5158, loss: 0.6985, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  68%|######7   | 75/111 [00:51<00:24,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8756, UAS: 0.9473, LAS: 0.9034, UEM: 0.5586, LEM: 0.3227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8980, partial_loss/deprel_loss: 0.7342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9401, loss: 0.7008, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  72%|#######2  | 80/111 [00:53<00:19,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9467, LAS: 0.9025, UEM: 0.5626, LEM: 0.3271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0960, partial_loss/deprel_loss: 0.3072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4381, loss: 0.7070, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  76%|#######5  | 84/111 [00:56<00:17,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9468, LAS: 0.9025, UEM: 0.5600, LEM: 0.3238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2817, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5759, loss: 0.7073, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  79%|#######9  | 88/111 [00:59<00:15,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9472, LAS: 0.9029, UEM: 0.5658, LEM: 0.3264, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2821, partial_loss/deprel_loss: 0.4354, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5779, loss: 0.7038, batch_reg_loss: 0.1732, reg_loss: 0.1733 ||:  83%|########2 | 92/111 [01:02<00:13,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9481, LAS: 0.9040, UEM: 0.5924, LEM: 0.3602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1210, partial_loss/deprel_loss: 0.2562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4023, loss: 0.6952, batch_reg_loss: 0.1732, reg_loss: 0.1732 ||:  86%|########5 | 95/111 [01:05<00:12,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9480, LAS: 0.9038, UEM: 0.5892, LEM: 0.3560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3368, partial_loss/deprel_loss: 0.5038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6435, loss: 0.6965, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||:  89%|########9 | 99/111 [01:07<00:08,  1.39it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9482, LAS: 0.9040, UEM: 0.5977, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1306, partial_loss/deprel_loss: 0.2463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3963, loss: 0.6941, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||:  92%|#########1| 102/111 [01:10<00:06,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9480, LAS: 0.9038, UEM: 0.5968, LEM: 0.3653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9104, partial_loss/deprel_loss: 0.7103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9235, loss: 0.6946, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||:  95%|#########4| 105/111 [01:12<00:04,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8919, UAS: 0.9480, LAS: 0.9037, UEM: 0.5927, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5892, partial_loss/deprel_loss: 0.6759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8316, loss: 0.6965, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||:  98%|#########8| 109/111 [01:14<00:01,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8419, UAS: 0.9473, LAS: 0.9031, UEM: 0.5895, LEM: 0.3579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4323, partial_loss/deprel_loss: 0.8211, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1164, loss: 0.7008, batch_reg_loss: 0.1731, reg_loss: 0.1732 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.821  |       N/A\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.432  |       N/A\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |       N/A\n",
      "2023-04-07 00:33:10,831 - INFO - combo.training.tensorboard_writer - UEM                      |     0.590  |       N/A\n",
      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - LAS                      |     0.903  |       N/A\n",
      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - loss                     |     0.701  |       N/A\n",
      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - LEM                      |     0.358  |       N/A\n",
      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - UAS                      |     0.947  |       N/A\n",
      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - EM                       |     0.842  |       N/A\n",
      "2023-04-07 00:33:10,832 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:33:10,837 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:33:15,301 - INFO - combo.training.trainer - Epoch duration: 0:01:23.706250\n",
      "2023-04-07 00:33:15,302 - INFO - combo.training.trainer - Estimated training time remaining: 7:14:01\n",
      "2023-04-07 00:33:15,302 - INFO - allennlp.training.trainer - Epoch 77/399\n",
      "2023-04-07 00:33:15,302 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:33:15,303 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:33:15,313 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9540, LAS: 0.9091, UEM: 0.4911, LEM: 0.2216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3272, partial_loss/deprel_loss: 0.4489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5977, loss: 0.6525, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:   4%|3         | 4/111 [00:02<01:08,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9550, LAS: 0.9096, UEM: 0.5444, LEM: 0.2853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1937, partial_loss/deprel_loss: 0.3571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4976, loss: 0.6352, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:   6%|6         | 7/111 [00:04<01:10,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9568, LAS: 0.9127, UEM: 0.6099, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3553, partial_loss/deprel_loss: 0.4601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6122, loss: 0.6160, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:   9%|9         | 10/111 [00:06<01:08,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9545, LAS: 0.9111, UEM: 0.5946, LEM: 0.3607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4713, partial_loss/deprel_loss: 0.5090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6746, loss: 0.6297, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  12%|#1        | 13/111 [00:09<01:08,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9542, LAS: 0.9106, UEM: 0.5909, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3604, partial_loss/deprel_loss: 0.4224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5831, loss: 0.6357, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  14%|#4        | 16/111 [00:11<01:07,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9000, UAS: 0.9499, LAS: 0.9057, UEM: 0.5877, LEM: 0.3513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5063, partial_loss/deprel_loss: 0.5628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7246, loss: 0.6704, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  17%|#7        | 19/111 [00:13<01:07,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9477, LAS: 0.9023, UEM: 0.5584, LEM: 0.3260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7295, partial_loss/deprel_loss: 0.6436, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8338, loss: 0.6924, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  20%|#9        | 22/111 [00:15<01:04,  1.38it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9458, LAS: 0.9005, UEM: 0.5394, LEM: 0.3091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4192, partial_loss/deprel_loss: 0.4877, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6471, loss: 0.7056, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  23%|##2       | 25/111 [00:18<01:03,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9491, LAS: 0.9041, UEM: 0.5924, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2642, partial_loss/deprel_loss: 0.3273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.6803, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  25%|##5       | 28/111 [00:20<00:59,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9486, LAS: 0.9040, UEM: 0.5864, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5366, partial_loss/deprel_loss: 0.5191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6956, loss: 0.6813, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  28%|##7       | 31/111 [00:22<00:56,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9203, UAS: 0.9480, LAS: 0.9034, UEM: 0.5770, LEM: 0.3385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.4163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5606, loss: 0.6854, batch_reg_loss: 0.1731, reg_loss: 0.1731 ||:  32%|###1      | 35/111 [00:24<00:52,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9487, LAS: 0.9038, UEM: 0.5780, LEM: 0.3365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2471, partial_loss/deprel_loss: 0.4322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5682, loss: 0.6814, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  34%|###4      | 38/111 [00:26<00:50,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9490, LAS: 0.9041, UEM: 0.5731, LEM: 0.3308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5803, partial_loss/deprel_loss: 0.6454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8054, loss: 0.6820, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  37%|###6      | 41/111 [00:29<00:49,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9311, UAS: 0.9507, LAS: 0.9061, UEM: 0.5970, LEM: 0.3520, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2123, partial_loss/deprel_loss: 0.3388, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4865, loss: 0.6680, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  40%|###9      | 44/111 [00:31<00:47,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9510, LAS: 0.9065, UEM: 0.5949, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5873, partial_loss/deprel_loss: 0.5985, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7692, loss: 0.6658, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  42%|####2     | 47/111 [00:33<00:46,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9517, LAS: 0.9072, UEM: 0.6124, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.3660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.6589, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  45%|####5     | 50/111 [00:35<00:45,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9068, UAS: 0.9508, LAS: 0.9060, UEM: 0.6017, LEM: 0.3565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3449, partial_loss/deprel_loss: 0.5163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6550, loss: 0.6699, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  49%|####8     | 54/111 [00:38<00:40,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9676, UAS: 0.9505, LAS: 0.9062, UEM: 0.6242, LEM: 0.3916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0425, partial_loss/deprel_loss: 0.1334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2883, loss: 0.6690, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  51%|#####1    | 57/111 [00:41<00:42,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9501, LAS: 0.9056, UEM: 0.6222, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3604, partial_loss/deprel_loss: 0.4116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5743, loss: 0.6729, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  55%|#####4    | 61/111 [00:43<00:36,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9498, LAS: 0.9051, UEM: 0.6129, LEM: 0.3819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6639, partial_loss/deprel_loss: 0.6474, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8237, loss: 0.6772, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  58%|#####7    | 64/111 [00:45<00:33,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9495, LAS: 0.9047, UEM: 0.6096, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3216, partial_loss/deprel_loss: 0.4934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6320, loss: 0.6809, batch_reg_loss: 0.1730, reg_loss: 0.1731 ||:  60%|######    | 67/111 [00:48<00:32,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9498, LAS: 0.9050, UEM: 0.6106, LEM: 0.3777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1373, partial_loss/deprel_loss: 0.2911, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4333, loss: 0.6803, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  63%|######3   | 70/111 [00:50<00:29,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9489, LAS: 0.9041, UEM: 0.6022, LEM: 0.3710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4646, partial_loss/deprel_loss: 0.4755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6463, loss: 0.6865, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  66%|######5   | 73/111 [00:52<00:28,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9125, UAS: 0.9492, LAS: 0.9046, UEM: 0.6020, LEM: 0.3689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3846, partial_loss/deprel_loss: 0.5038, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.6829, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  68%|######8   | 76/111 [00:54<00:26,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8673, UAS: 0.9493, LAS: 0.9047, UEM: 0.5995, LEM: 0.3650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0225, partial_loss/deprel_loss: 0.7170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9511, loss: 0.6818, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  72%|#######2  | 80/111 [00:57<00:21,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9496, LAS: 0.9049, UEM: 0.5995, LEM: 0.3628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3052, partial_loss/deprel_loss: 0.4495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5936, loss: 0.6812, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  75%|#######4  | 83/111 [00:59<00:20,  1.39it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9490, LAS: 0.9043, UEM: 0.5976, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9099, partial_loss/deprel_loss: 0.7320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9406, loss: 0.6865, batch_reg_loss: 0.1730, reg_loss: 0.1730 ||:  78%|#######8  | 87/111 [01:02<00:16,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9490, LAS: 0.9044, UEM: 0.5949, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3954, partial_loss/deprel_loss: 0.4187, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5870, loss: 0.6859, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  81%|########1 | 90/111 [01:06<00:20,  1.04it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9494, LAS: 0.9049, UEM: 0.6072, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0955, partial_loss/deprel_loss: 0.2082, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3586, loss: 0.6819, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  84%|########3 | 93/111 [01:09<00:17,  1.06it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8814, UAS: 0.9491, LAS: 0.9046, UEM: 0.6034, LEM: 0.3721, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7977, partial_loss/deprel_loss: 0.6350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8405, loss: 0.6841, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  86%|########6 | 96/111 [01:11<00:13,  1.15it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9492, LAS: 0.9047, UEM: 0.6042, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2056, partial_loss/deprel_loss: 0.3270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4756, loss: 0.6822, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  89%|########9 | 99/111 [01:13<00:09,  1.21it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9485, LAS: 0.9039, UEM: 0.5998, LEM: 0.3694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6815, partial_loss/deprel_loss: 0.5970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7868, loss: 0.6867, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  92%|#########1| 102/111 [01:15<00:07,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8910, UAS: 0.9487, LAS: 0.9040, UEM: 0.5997, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6866, partial_loss/deprel_loss: 0.6442, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8256, loss: 0.6861, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  95%|#########4| 105/111 [01:18<00:04,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8776, UAS: 0.9485, LAS: 0.9037, UEM: 0.5933, LEM: 0.3618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8087, partial_loss/deprel_loss: 0.8120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9843, loss: 0.6896, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||:  98%|#########8| 109/111 [01:20<00:01,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9480, LAS: 0.9032, UEM: 0.5896, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0166, partial_loss/deprel_loss: 0.6683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9109, loss: 0.6941, batch_reg_loss: 0.1729, reg_loss: 0.1730 ||: 100%|##########| 111/111 [01:21<00:00,  1.35it/s]\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.668  |       N/A\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     1.017  |       N/A\n",
      "2023-04-07 00:34:40,190 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |       N/A\n",
      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - UEM                      |     0.590  |       N/A\n",
      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - LAS                      |     0.903  |       N/A\n",
      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - loss                     |     0.694  |       N/A\n",
      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - LEM                      |     0.359  |       N/A\n",
      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - UAS                      |     0.948  |       N/A\n",
      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - EM                       |     0.875  |       N/A\n",
      "2023-04-07 00:34:40,191 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:34:40,196 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:34:44,979 - INFO - combo.training.trainer - Epoch duration: 0:01:29.676969\n",
      "2023-04-07 00:34:44,980 - INFO - combo.training.trainer - Estimated training time remaining: 7:13:18\n",
      "2023-04-07 00:34:44,980 - INFO - allennlp.training.trainer - Epoch 78/399\n",
      "2023-04-07 00:34:44,980 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:34:44,981 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:34:44,988 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9679, LAS: 0.9231, UEM: 0.7181, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3375, partial_loss/deprel_loss: 0.3727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5386, loss: 0.5293, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:   3%|2         | 3/111 [00:02<01:15,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9566, LAS: 0.9133, UEM: 0.6358, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6508, partial_loss/deprel_loss: 0.6221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8007, loss: 0.6167, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:   5%|5         | 6/111 [00:04<01:13,  1.43it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9543, LAS: 0.9101, UEM: 0.6182, LEM: 0.3409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3246, partial_loss/deprel_loss: 0.4870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6274, loss: 0.6452, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8786, UAS: 0.9486, LAS: 0.9035, UEM: 0.5601, LEM: 0.3033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8651, partial_loss/deprel_loss: 0.6585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8727, loss: 0.6916, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  12%|#1        | 13/111 [00:08<01:07,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9496, LAS: 0.9042, UEM: 0.5650, LEM: 0.2982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5894, partial_loss/deprel_loss: 0.5549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7347, loss: 0.6833, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  14%|#4        | 16/111 [00:11<01:06,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8911, UAS: 0.9507, LAS: 0.9051, UEM: 0.5807, LEM: 0.3174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5727, partial_loss/deprel_loss: 0.6267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7888, loss: 0.6759, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  17%|#7        | 19/111 [00:13<01:07,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9504, LAS: 0.9054, UEM: 0.5797, LEM: 0.3181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5428, partial_loss/deprel_loss: 0.5371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7111, loss: 0.6827, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  20%|#9        | 22/111 [00:15<01:05,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8458, UAS: 0.9482, LAS: 0.9033, UEM: 0.5805, LEM: 0.3326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2453, partial_loss/deprel_loss: 0.8579, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1083, loss: 0.6936, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  23%|##2       | 25/111 [00:17<01:03,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9480, LAS: 0.9034, UEM: 0.5686, LEM: 0.3231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7153, partial_loss/deprel_loss: 0.5758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7766, loss: 0.6925, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  25%|##5       | 28/111 [00:20<01:03,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9483, LAS: 0.9041, UEM: 0.5652, LEM: 0.3186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2857, partial_loss/deprel_loss: 0.3994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5495, loss: 0.6867, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  28%|##7       | 31/111 [00:22<01:02,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8680, UAS: 0.9485, LAS: 0.9044, UEM: 0.5621, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0274, partial_loss/deprel_loss: 0.8121, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0280, loss: 0.6880, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  32%|###1      | 35/111 [00:25<00:54,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8752, UAS: 0.9465, LAS: 0.9023, UEM: 0.5479, LEM: 0.3012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8060, partial_loss/deprel_loss: 0.7816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9593, loss: 0.7045, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  35%|###5      | 39/111 [00:27<00:50,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9456, LAS: 0.9013, UEM: 0.5402, LEM: 0.2945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5544, partial_loss/deprel_loss: 0.6268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7852, loss: 0.7115, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  38%|###7      | 42/111 [00:29<00:47,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9461, LAS: 0.9019, UEM: 0.5449, LEM: 0.2997, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7151, partial_loss/deprel_loss: 0.7046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8796, loss: 0.7092, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  41%|####      | 45/111 [00:31<00:45,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9474, LAS: 0.9031, UEM: 0.5644, LEM: 0.3191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5186, partial_loss/deprel_loss: 0.6419, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7901, loss: 0.7012, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  43%|####3     | 48/111 [00:34<00:45,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8818, UAS: 0.9469, LAS: 0.9025, UEM: 0.5606, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8224, partial_loss/deprel_loss: 0.6433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8520, loss: 0.7051, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  47%|####6     | 52/111 [00:36<00:40,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9475, LAS: 0.9031, UEM: 0.5585, LEM: 0.3156, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2593, partial_loss/deprel_loss: 0.3815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5299, loss: 0.7007, batch_reg_loss: 0.1729, reg_loss: 0.1729 ||:  50%|####9     | 55/111 [00:38<00:39,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9470, LAS: 0.9024, UEM: 0.5479, LEM: 0.3069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4642, partial_loss/deprel_loss: 0.5490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7049, loss: 0.7073, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  53%|#####3    | 59/111 [00:41<00:34,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9475, LAS: 0.9030, UEM: 0.5552, LEM: 0.3137, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4942, partial_loss/deprel_loss: 0.5451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7077, loss: 0.7039, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  57%|#####6    | 63/111 [00:43<00:32,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9472, LAS: 0.9028, UEM: 0.5517, LEM: 0.3139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3959, partial_loss/deprel_loss: 0.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6006, loss: 0.7036, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  60%|######    | 67/111 [00:46<00:30,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9478, LAS: 0.9035, UEM: 0.5566, LEM: 0.3166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2160, partial_loss/deprel_loss: 0.3595, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5036, loss: 0.6997, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  64%|######3   | 71/111 [00:49<00:27,  1.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9476, LAS: 0.9032, UEM: 0.5699, LEM: 0.3348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0714, partial_loss/deprel_loss: 0.2042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3505, loss: 0.7030, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  67%|######6   | 74/111 [00:51<00:25,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9465, LAS: 0.9023, UEM: 0.5679, LEM: 0.3350, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8180, partial_loss/deprel_loss: 0.6136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8273, loss: 0.7098, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  69%|######9   | 77/111 [00:54<00:24,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9465, LAS: 0.9021, UEM: 0.5639, LEM: 0.3299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6078, partial_loss/deprel_loss: 0.6108, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7830, loss: 0.7105, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  73%|#######2  | 81/111 [00:56<00:21,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9470, LAS: 0.9028, UEM: 0.5722, LEM: 0.3391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1430, partial_loss/deprel_loss: 0.2524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4033, loss: 0.7049, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  76%|#######5  | 84/111 [00:58<00:19,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8863, UAS: 0.9474, LAS: 0.9034, UEM: 0.5887, LEM: 0.3620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6315, partial_loss/deprel_loss: 0.6066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7844, loss: 0.6999, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  78%|#######8  | 87/111 [01:01<00:17,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9481, LAS: 0.9040, UEM: 0.5977, LEM: 0.3680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.4475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5810, loss: 0.6947, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  81%|########1 | 90/111 [01:03<00:15,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9479, LAS: 0.9036, UEM: 0.5902, LEM: 0.3608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6856, partial_loss/deprel_loss: 0.5673, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7637, loss: 0.6968, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  85%|########4 | 94/111 [01:06<00:12,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9479, LAS: 0.9038, UEM: 0.5882, LEM: 0.3587, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3477, partial_loss/deprel_loss: 0.5077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6485, loss: 0.6960, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  87%|########7 | 97/111 [01:08<00:10,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9475, LAS: 0.9035, UEM: 0.5840, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6664, partial_loss/deprel_loss: 0.5377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7362, loss: 0.6976, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  90%|######### | 100/111 [01:10<00:07,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9480, LAS: 0.9041, UEM: 0.5887, LEM: 0.3604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1575, partial_loss/deprel_loss: 0.2746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4240, loss: 0.6932, batch_reg_loss: 0.1728, reg_loss: 0.1729 ||:  94%|#########3| 104/111 [01:13<00:04,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9486, LAS: 0.9047, UEM: 0.5946, LEM: 0.3647, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2394, partial_loss/deprel_loss: 0.3851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5287, loss: 0.6893, batch_reg_loss: 0.1728, reg_loss: 0.1728 ||:  96%|#########6| 107/111 [01:15<00:02,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9489, LAS: 0.9049, UEM: 0.5942, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6411, partial_loss/deprel_loss: 0.6306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8055, loss: 0.6882, batch_reg_loss: 0.1728, reg_loss: 0.1728 ||:  99%|#########9| 110/111 [01:17<00:00,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9489, LAS: 0.9048, UEM: 0.5932, LEM: 0.3620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4630, partial_loss/deprel_loss: 0.6202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7615, loss: 0.6888, batch_reg_loss: 0.1728, reg_loss: 0.1728 ||: 100%|##########| 111/111 [01:18<00:00,  1.42it/s]\n",
      "2023-04-07 00:36:06,576 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.620  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.463  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - UEM                      |     0.593  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - LAS                      |     0.905  |       N/A\n",
      "2023-04-07 00:36:06,577 - INFO - combo.training.tensorboard_writer - loss                     |     0.689  |       N/A\n",
      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - LEM                      |     0.362  |       N/A\n",
      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - UAS                      |     0.949  |       N/A\n",
      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - EM                       |     0.898  |       N/A\n",
      "2023-04-07 00:36:06,578 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:36:06,583 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:36:11,692 - INFO - combo.training.trainer - Epoch duration: 0:01:26.712266\n",
      "2023-04-07 00:36:11,693 - INFO - combo.training.trainer - Estimated training time remaining: 7:12:21\n",
      "2023-04-07 00:36:11,693 - INFO - allennlp.training.trainer - Epoch 79/399\n",
      "2023-04-07 00:36:11,693 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:36:11,693 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:36:11,701 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9323, UAS: 0.9567, LAS: 0.9180, UEM: 0.5695, LEM: 0.3250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2451, partial_loss/deprel_loss: 0.4015, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5430, loss: 0.6235, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:   4%|3         | 4/111 [00:02<01:09,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8239, UAS: 0.9426, LAS: 0.9010, UEM: 0.4922, LEM: 0.2686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7117, partial_loss/deprel_loss: 1.0595, partial_loss/cycle_loss: 0.0000, batch_loss: 1.3627, loss: 0.7478, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:   7%|7         | 8/111 [00:05<01:08,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9500, LAS: 0.9082, UEM: 0.6338, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3560, partial_loss/deprel_loss: 0.5119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6534, loss: 0.6912, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  10%|9         | 11/111 [00:07<01:08,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9476, LAS: 0.9051, UEM: 0.5838, LEM: 0.3653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3645, partial_loss/deprel_loss: 0.4990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6448, loss: 0.7086, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  14%|#3        | 15/111 [00:10<01:04,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9468, LAS: 0.9040, UEM: 0.5621, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3119, partial_loss/deprel_loss: 0.4127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5653, loss: 0.7126, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  16%|#6        | 18/111 [00:12<01:03,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9495, LAS: 0.9071, UEM: 0.6012, LEM: 0.3786, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1973, partial_loss/deprel_loss: 0.3137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4632, loss: 0.6835, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  19%|#8        | 21/111 [00:14<01:00,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9512, LAS: 0.9097, UEM: 0.6573, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7300, partial_loss/deprel_loss: 0.6385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8295, loss: 0.6655, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  22%|##1       | 24/111 [00:16<01:02,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9152, UAS: 0.9509, LAS: 0.9091, UEM: 0.6380, LEM: 0.4309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3313, partial_loss/deprel_loss: 0.4382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5895, loss: 0.6719, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  25%|##5       | 28/111 [00:19<00:57,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9527, LAS: 0.9108, UEM: 0.6429, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2971, partial_loss/deprel_loss: 0.4320, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5777, loss: 0.6572, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  29%|##8       | 32/111 [00:21<00:51,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9526, LAS: 0.9103, UEM: 0.6318, LEM: 0.4139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3001, partial_loss/deprel_loss: 0.4517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5941, loss: 0.6554, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  32%|###1      | 35/111 [00:23<00:50,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8422, UAS: 0.9514, LAS: 0.9086, UEM: 0.6262, LEM: 0.4088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2311, partial_loss/deprel_loss: 0.8674, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1128, loss: 0.6664, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  34%|###4      | 38/111 [00:25<00:49,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9524, LAS: 0.9097, UEM: 0.6317, LEM: 0.4082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2377, partial_loss/deprel_loss: 0.3761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5211, loss: 0.6570, batch_reg_loss: 0.1727, reg_loss: 0.1727 ||:  37%|###6      | 41/111 [00:27<00:48,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9507, LAS: 0.9078, UEM: 0.6229, LEM: 0.4022, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1997, partial_loss/deprel_loss: 0.3551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4966, loss: 0.6716, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  41%|####      | 45/111 [00:30<00:45,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9501, LAS: 0.9073, UEM: 0.6259, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1513, partial_loss/deprel_loss: 0.2561, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4078, loss: 0.6734, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  44%|####4     | 49/111 [00:33<00:43,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9051, UAS: 0.9506, LAS: 0.9077, UEM: 0.6257, LEM: 0.4059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5370, partial_loss/deprel_loss: 0.5998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7598, loss: 0.6716, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  47%|####6     | 52/111 [00:35<00:41,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9509, LAS: 0.9082, UEM: 0.6271, LEM: 0.4067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.2975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4542, loss: 0.6671, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  50%|#####     | 56/111 [00:38<00:38,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9504, LAS: 0.9075, UEM: 0.6145, LEM: 0.3936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5854, partial_loss/deprel_loss: 0.5008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6903, loss: 0.6702, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  54%|#####4    | 60/111 [00:40<00:33,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9511, LAS: 0.9083, UEM: 0.6169, LEM: 0.3916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3994, partial_loss/deprel_loss: 0.4495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6121, loss: 0.6644, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  58%|#####7    | 64/111 [00:43<00:32,  1.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9515, LAS: 0.9084, UEM: 0.6153, LEM: 0.3867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2341, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5563, loss: 0.6629, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  60%|######    | 67/111 [00:45<00:30,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8708, UAS: 0.9511, LAS: 0.9079, UEM: 0.6110, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8882, partial_loss/deprel_loss: 0.7016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9115, loss: 0.6672, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  63%|######3   | 70/111 [00:48<00:29,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9509, LAS: 0.9078, UEM: 0.6095, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1806, partial_loss/deprel_loss: 0.3297, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4725, loss: 0.6690, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  66%|######5   | 73/111 [00:50<00:27,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9185, UAS: 0.9505, LAS: 0.9071, UEM: 0.6078, LEM: 0.3788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2898, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5766, loss: 0.6730, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  69%|######9   | 77/111 [00:52<00:23,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9508, LAS: 0.9073, UEM: 0.6133, LEM: 0.3822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1380, partial_loss/deprel_loss: 0.3113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4492, loss: 0.6704, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  72%|#######2  | 80/111 [00:54<00:21,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9498, LAS: 0.9063, UEM: 0.6056, LEM: 0.3753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5038, partial_loss/deprel_loss: 0.9507, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2339, loss: 0.6799, batch_reg_loss: 0.1726, reg_loss: 0.1727 ||:  76%|#######5  | 84/111 [00:57<00:18,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9499, LAS: 0.9062, UEM: 0.6077, LEM: 0.3767, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6644, partial_loss/deprel_loss: 0.6769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8469, loss: 0.6789, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  78%|#######8  | 87/111 [00:59<00:16,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8672, UAS: 0.9496, LAS: 0.9058, UEM: 0.6070, LEM: 0.3774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7890, partial_loss/deprel_loss: 0.8387, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0013, loss: 0.6827, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  81%|########1 | 90/111 [01:01<00:14,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9486, LAS: 0.9046, UEM: 0.5989, LEM: 0.3707, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4162, partial_loss/deprel_loss: 0.5504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6961, loss: 0.6908, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  85%|########4 | 94/111 [01:04<00:11,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9480, LAS: 0.9039, UEM: 0.5931, LEM: 0.3646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6230, partial_loss/deprel_loss: 0.6034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7799, loss: 0.6954, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  88%|########8 | 98/111 [01:07<00:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9481, LAS: 0.9041, UEM: 0.5966, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8358, partial_loss/deprel_loss: 0.7337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9267, loss: 0.6936, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  91%|######### | 101/111 [01:09<00:07,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9029, UAS: 0.9480, LAS: 0.9040, UEM: 0.5914, LEM: 0.3628, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4340, partial_loss/deprel_loss: 0.4662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6323, loss: 0.6934, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  95%|#########4| 105/111 [01:11<00:04,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9478, LAS: 0.9037, UEM: 0.5856, LEM: 0.3578, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8297, partial_loss/deprel_loss: 0.6664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8716, loss: 0.6959, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||:  98%|#########8| 109/111 [01:14<00:01,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9479, LAS: 0.9038, UEM: 0.5869, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7285, partial_loss/deprel_loss: 0.5894, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7897, loss: 0.6951, batch_reg_loss: 0.1725, reg_loss: 0.1726 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
      "2023-04-07 00:37:30,881 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.589  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.729  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.173  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - UEM                      |     0.587  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - LAS                      |     0.904  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - loss                     |     0.695  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:37:30,882 - INFO - combo.training.tensorboard_writer - LEM                      |     0.360  |       N/A\n",
      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - UAS                      |     0.948  |       N/A\n",
      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - EM                       |     0.889  |       N/A\n",
      "2023-04-07 00:37:30,883 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:37:30,890 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:37:36,892 - INFO - combo.training.trainer - Epoch duration: 0:01:25.198854\n",
      "2023-04-07 00:37:36,892 - INFO - combo.training.trainer - Estimated training time remaining: 7:11:18\n",
      "2023-04-07 00:37:36,892 - INFO - allennlp.training.trainer - Epoch 80/399\n",
      "2023-04-07 00:37:36,893 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:37:36,893 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:37:36,903 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9620, LAS: 0.9237, UEM: 0.6907, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3221, partial_loss/deprel_loss: 0.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5716, loss: 0.5313, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9603, LAS: 0.9177, UEM: 0.6303, LEM: 0.3688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4412, partial_loss/deprel_loss: 0.5262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6817, loss: 0.5811, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:   5%|5         | 6/111 [00:04<01:15,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8889, UAS: 0.9588, LAS: 0.9181, UEM: 0.6741, LEM: 0.4565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7152, partial_loss/deprel_loss: 0.6657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8481, loss: 0.5944, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:   8%|8         | 9/111 [00:06<01:14,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9549, LAS: 0.9129, UEM: 0.6113, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3193, partial_loss/deprel_loss: 0.4733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6149, loss: 0.6329, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  12%|#1        | 13/111 [00:09<01:08,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9546, LAS: 0.9125, UEM: 0.6094, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4229, partial_loss/deprel_loss: 0.4221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5947, loss: 0.6348, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  14%|#4        | 16/111 [00:11<01:08,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8754, UAS: 0.9532, LAS: 0.9108, UEM: 0.6202, LEM: 0.4140, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9059, partial_loss/deprel_loss: 0.7547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9574, loss: 0.6489, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  17%|#7        | 19/111 [00:13<01:07,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9530, LAS: 0.9100, UEM: 0.6040, LEM: 0.3906, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3067, partial_loss/deprel_loss: 0.4951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6299, loss: 0.6532, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  20%|#9        | 22/111 [00:15<01:05,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9490, LAS: 0.9057, UEM: 0.5830, LEM: 0.3724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4699, partial_loss/deprel_loss: 0.5475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7044, loss: 0.6857, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  23%|##2       | 25/111 [00:18<01:03,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9299, UAS: 0.9502, LAS: 0.9070, UEM: 0.5930, LEM: 0.3742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2599, partial_loss/deprel_loss: 0.4180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5588, loss: 0.6773, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  26%|##6       | 29/111 [00:20<00:58,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9518, LAS: 0.9092, UEM: 0.6273, LEM: 0.4061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2288, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5173, loss: 0.6576, batch_reg_loss: 0.1725, reg_loss: 0.1725 ||:  29%|##8       | 32/111 [00:23<00:57,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9495, LAS: 0.9065, UEM: 0.6101, LEM: 0.3909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4890, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7113, loss: 0.6791, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  32%|###1      | 35/111 [00:25<00:54,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9486, LAS: 0.9054, UEM: 0.6030, LEM: 0.3847, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5379, partial_loss/deprel_loss: 0.5874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7500, loss: 0.6869, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  34%|###4      | 38/111 [00:27<00:52,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8247, UAS: 0.9468, LAS: 0.9033, UEM: 0.5977, LEM: 0.3799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7654, partial_loss/deprel_loss: 0.9535, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2883, loss: 0.7037, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  37%|###6      | 41/111 [00:29<00:49,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9469, LAS: 0.9034, UEM: 0.5872, LEM: 0.3688, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3795, partial_loss/deprel_loss: 0.3789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5514, loss: 0.7030, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  41%|####      | 45/111 [00:31<00:44,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9462, LAS: 0.9022, UEM: 0.5714, LEM: 0.3543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5592, partial_loss/deprel_loss: 0.6000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7643, loss: 0.7125, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  44%|####4     | 49/111 [00:34<00:40,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9474, LAS: 0.9035, UEM: 0.5757, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3003, partial_loss/deprel_loss: 0.4217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5699, loss: 0.7029, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  48%|####7     | 53/111 [00:37<00:41,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9485, LAS: 0.9047, UEM: 0.5836, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2203, partial_loss/deprel_loss: 0.3744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.6956, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  50%|#####     | 56/111 [00:39<00:39,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9483, LAS: 0.9043, UEM: 0.5866, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1981, partial_loss/deprel_loss: 0.3500, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4921, loss: 0.6978, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  53%|#####3    | 59/111 [00:41<00:36,  1.42it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9490, LAS: 0.9051, UEM: 0.5953, LEM: 0.3652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2126, partial_loss/deprel_loss: 0.3401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4870, loss: 0.6900, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  56%|#####5    | 62/111 [00:44<00:37,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9492, LAS: 0.9052, UEM: 0.5994, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2119, partial_loss/deprel_loss: 0.3785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5176, loss: 0.6883, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  59%|#####8    | 65/111 [00:46<00:34,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9495, LAS: 0.9056, UEM: 0.6049, LEM: 0.3719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1288, partial_loss/deprel_loss: 0.3110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4469, loss: 0.6860, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  61%|######1   | 68/111 [00:48<00:31,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9491, LAS: 0.9052, UEM: 0.6076, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3398, partial_loss/deprel_loss: 0.7577, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0465, loss: 0.6871, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  64%|######3   | 71/111 [00:50<00:29,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9494, LAS: 0.9057, UEM: 0.6087, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2983, partial_loss/deprel_loss: 0.4091, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5593, loss: 0.6846, batch_reg_loss: 0.1724, reg_loss: 0.1725 ||:  67%|######6   | 74/111 [00:53<00:27,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9496, LAS: 0.9057, UEM: 0.6040, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3739, partial_loss/deprel_loss: 0.5073, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6530, loss: 0.6851, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:  70%|#######   | 78/111 [00:55<00:22,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9166, UAS: 0.9496, LAS: 0.9056, UEM: 0.6007, LEM: 0.3625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.4565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.6847, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:  74%|#######3  | 82/111 [00:57<00:19,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9495, LAS: 0.9057, UEM: 0.5956, LEM: 0.3583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4589, partial_loss/deprel_loss: 0.4744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6437, loss: 0.6845, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:  77%|#######6  | 85/111 [01:00<00:18,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9495, LAS: 0.9056, UEM: 0.5939, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2203, partial_loss/deprel_loss: 0.3479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4947, loss: 0.6853, batch_reg_loss: 0.1724, reg_loss: 0.1724 ||:  80%|########  | 89/111 [01:02<00:14,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9491, LAS: 0.9052, UEM: 0.5858, LEM: 0.3478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7029, partial_loss/deprel_loss: 0.6080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7993, loss: 0.6869, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||:  84%|########3 | 93/111 [01:05<00:11,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9482, LAS: 0.9041, UEM: 0.5799, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9657, partial_loss/deprel_loss: 0.7077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9316, loss: 0.6950, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||:  87%|########7 | 97/111 [01:07<00:09,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9015, UAS: 0.9480, LAS: 0.9037, UEM: 0.5733, LEM: 0.3373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5950, partial_loss/deprel_loss: 0.5820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7570, loss: 0.6973, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||:  91%|######### | 101/111 [01:10<00:06,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9483, LAS: 0.9039, UEM: 0.5756, LEM: 0.3389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5457, partial_loss/deprel_loss: 0.6095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7691, loss: 0.6958, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||:  95%|#########4| 105/111 [01:13<00:04,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9485, LAS: 0.9043, UEM: 0.5833, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2313, partial_loss/deprel_loss: 0.3321, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4842, loss: 0.6930, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||:  97%|#########7| 108/111 [01:15<00:02,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9487, LAS: 0.9045, UEM: 0.5949, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7318, partial_loss/deprel_loss: 0.6724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8566, loss: 0.6913, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||: 100%|##########| 111/111 [01:17<00:00,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8750, UAS: 0.9487, LAS: 0.9045, UEM: 0.5949, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7318, partial_loss/deprel_loss: 0.6724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8566, loss: 0.6913, batch_reg_loss: 0.1723, reg_loss: 0.1724 ||: 100%|##########| 111/111 [01:17<00:00,  1.43it/s]\n",
      "2023-04-07 00:38:57,543 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8646, UAS: 0.9029, LAS: 0.8477, UEM: 0.1151, LEM: 0.0144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3311, partial_loss/deprel_loss: 47.7680, partial_loss/cycle_loss: 0.0000, batch_loss: 38.4806, loss: 41.8893, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.09s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9320, LAS: 0.8765, UEM: 0.5111, LEM: 0.2229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5485, partial_loss/deprel_loss: 24.1775, partial_loss/cycle_loss: 0.0000, batch_loss: 19.4517, loss: 30.7239, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:05<00:08,  1.05s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9407, LAS: 0.8871, UEM: 0.6027, LEM: 0.3056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1748, partial_loss/deprel_loss: 23.6009, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9157, loss: 28.3449, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:05,  1.01s/it]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9280, UAS: 0.9430, LAS: 0.8909, UEM: 0.5963, LEM: 0.3052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3954, partial_loss/deprel_loss: 17.4416, partial_loss/cycle_loss: 0.0000, batch_loss: 14.0323, loss: 26.6526, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.04it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9458, LAS: 0.8946, UEM: 0.6489, LEM: 0.3860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7757, partial_loss/deprel_loss: 29.8046, partial_loss/cycle_loss: 0.0000, batch_loss: 23.9988, loss: 25.6342, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.06it/s]\n",
      "2023-04-07 00:39:09,770 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-07 00:39:09,772 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.672  |    29.805\n",
      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.732  |     0.776\n",
      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |     0.000\n",
      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - UEM                      |     0.595  |     0.649\n",
      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - LAS                      |     0.904  |     0.895\n",
      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - loss                     |     0.691  |    25.634\n",
      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - LEM                      |     0.365  |     0.386\n",
      "2023-04-07 00:39:09,773 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - UAS                      |     0.949  |     0.946\n",
      "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - EM                       |     0.875  |     0.881\n",
      "2023-04-07 00:39:09,774 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:39:09,780 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:39:14,857 - INFO - combo.training.trainer - Epoch duration: 0:01:37.964569\n",
      "2023-04-07 00:39:14,858 - INFO - combo.training.trainer - Estimated training time remaining: 7:11:04\n",
      "2023-04-07 00:39:14,858 - INFO - allennlp.training.trainer - Epoch 81/399\n",
      "2023-04-07 00:39:14,858 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:39:14,859 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:39:14,868 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9547, LAS: 0.9104, UEM: 0.6792, LEM: 0.4550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5030, partial_loss/deprel_loss: 0.5679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7273, loss: 0.6154, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:   3%|2         | 3/111 [00:02<01:14,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9549, LAS: 0.9128, UEM: 0.7015, LEM: 0.4632, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2751, partial_loss/deprel_loss: 0.3782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5299, loss: 0.6082, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:   6%|6         | 7/111 [00:04<01:10,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9524, LAS: 0.9107, UEM: 0.6876, LEM: 0.4629, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6333, partial_loss/deprel_loss: 0.6023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7808, loss: 0.6312, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:   9%|9         | 10/111 [00:06<01:09,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9514, LAS: 0.9102, UEM: 0.6589, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4960, partial_loss/deprel_loss: 0.5311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6964, loss: 0.6450, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  12%|#1        | 13/111 [00:08<01:06,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9522, LAS: 0.9101, UEM: 0.6362, LEM: 0.4087, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2727, partial_loss/deprel_loss: 0.4308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5715, loss: 0.6486, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  14%|#4        | 16/111 [00:11<01:10,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9496, LAS: 0.9079, UEM: 0.6037, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4495, partial_loss/deprel_loss: 0.4817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6475, loss: 0.6674, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  17%|#7        | 19/111 [00:13<01:07,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9513, LAS: 0.9092, UEM: 0.6182, LEM: 0.3905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2502, partial_loss/deprel_loss: 0.4057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5469, loss: 0.6559, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  20%|#9        | 22/111 [00:15<01:05,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9502, LAS: 0.9075, UEM: 0.6075, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1735, partial_loss/deprel_loss: 0.3221, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4646, loss: 0.6651, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  23%|##2       | 25/111 [00:17<01:02,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9510, LAS: 0.9083, UEM: 0.6091, LEM: 0.3793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1998, partial_loss/deprel_loss: 0.3217, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4696, loss: 0.6594, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  25%|##5       | 28/111 [00:20<01:01,  1.35it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8468, UAS: 0.9499, LAS: 0.9070, UEM: 0.6042, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2352, partial_loss/deprel_loss: 0.7932, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0539, loss: 0.6675, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  28%|##7       | 31/111 [00:22<00:59,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9509, LAS: 0.9084, UEM: 0.6005, LEM: 0.3653, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3909, partial_loss/deprel_loss: 0.4168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5838, loss: 0.6564, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  32%|###1      | 35/111 [00:25<00:54,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9528, LAS: 0.9105, UEM: 0.6227, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2360, partial_loss/deprel_loss: 0.3608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5081, loss: 0.6427, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  34%|###4      | 38/111 [00:27<00:52,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9514, LAS: 0.9089, UEM: 0.6216, LEM: 0.3814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4446, partial_loss/deprel_loss: 0.4394, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6127, loss: 0.6547, batch_reg_loss: 0.1723, reg_loss: 0.1723 ||:  37%|###6      | 41/111 [00:29<00:50,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9518, LAS: 0.9095, UEM: 0.6119, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4576, partial_loss/deprel_loss: 0.4736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6427, loss: 0.6515, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  41%|####      | 45/111 [00:31<00:45,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9508, LAS: 0.9086, UEM: 0.6184, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1493, partial_loss/deprel_loss: 0.2488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4012, loss: 0.6600, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  43%|####3     | 48/111 [00:34<00:45,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9505, LAS: 0.9082, UEM: 0.6075, LEM: 0.3719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6031, partial_loss/deprel_loss: 0.5009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6935, loss: 0.6638, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  46%|####5     | 51/111 [00:36<00:44,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9509, LAS: 0.9087, UEM: 0.6097, LEM: 0.3735, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1804, partial_loss/deprel_loss: 0.3201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4644, loss: 0.6610, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  49%|####8     | 54/111 [00:38<00:42,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8718, UAS: 0.9501, LAS: 0.9077, UEM: 0.6038, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0205, partial_loss/deprel_loss: 0.7639, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9874, loss: 0.6706, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  51%|#####1    | 57/111 [00:41<00:39,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8983, UAS: 0.9498, LAS: 0.9072, UEM: 0.5953, LEM: 0.3598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6021, partial_loss/deprel_loss: 0.5233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7113, loss: 0.6743, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  55%|#####4    | 61/111 [00:43<00:35,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9496, LAS: 0.9071, UEM: 0.5866, LEM: 0.3521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3604, partial_loss/deprel_loss: 0.4199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5802, loss: 0.6753, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  59%|#####8    | 65/111 [00:46<00:31,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9505, LAS: 0.9079, UEM: 0.5911, LEM: 0.3532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2425, partial_loss/deprel_loss: 0.4279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5631, loss: 0.6692, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  62%|######2   | 69/111 [00:49<00:29,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9508, LAS: 0.9080, UEM: 0.5965, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1185, partial_loss/deprel_loss: 0.3069, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4414, loss: 0.6676, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  66%|######5   | 73/111 [00:51<00:26,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9508, LAS: 0.9081, UEM: 0.6005, LEM: 0.3605, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2179, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.6657, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  68%|######8   | 76/111 [00:54<00:26,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9501, LAS: 0.9073, UEM: 0.5916, LEM: 0.3543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7469, partial_loss/deprel_loss: 0.6689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8567, loss: 0.6726, batch_reg_loss: 0.1722, reg_loss: 0.1723 ||:  71%|#######1  | 79/111 [00:56<00:23,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8454, UAS: 0.9500, LAS: 0.9070, UEM: 0.5944, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3228, partial_loss/deprel_loss: 0.8789, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1398, loss: 0.6744, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  75%|#######4  | 83/111 [00:59<00:20,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9497, LAS: 0.9067, UEM: 0.5907, LEM: 0.3531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1929, partial_loss/deprel_loss: 0.2878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4410, loss: 0.6763, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  78%|#######8  | 87/111 [01:01<00:16,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9492, LAS: 0.9060, UEM: 0.5841, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6835, partial_loss/deprel_loss: 0.5940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7840, loss: 0.6808, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  81%|########1 | 90/111 [01:03<00:14,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9490, LAS: 0.9058, UEM: 0.5808, LEM: 0.3447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7765, partial_loss/deprel_loss: 0.6530, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8498, loss: 0.6830, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  84%|########3 | 93/111 [01:05<00:12,  1.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9491, LAS: 0.9058, UEM: 0.5772, LEM: 0.3403, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6823, partial_loss/deprel_loss: 0.6745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8483, loss: 0.6848, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  87%|########7 | 97/111 [01:08<00:09,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9499, LAS: 0.9066, UEM: 0.5916, LEM: 0.3558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2769, partial_loss/deprel_loss: 0.4403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.6777, batch_reg_loss: 0.1722, reg_loss: 0.1722 ||:  91%|######### | 101/111 [01:11<00:06,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9636, UAS: 0.9495, LAS: 0.9062, UEM: 0.6024, LEM: 0.3746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0667, partial_loss/deprel_loss: 0.1438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3005, loss: 0.6809, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||:  94%|#########3| 104/111 [01:13<00:05,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9497, LAS: 0.9063, UEM: 0.6006, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4018, partial_loss/deprel_loss: 0.4389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6036, loss: 0.6805, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||:  96%|#########6| 107/111 [01:16<00:02,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9496, LAS: 0.9061, UEM: 0.5974, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3216, partial_loss/deprel_loss: 0.4782, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6190, loss: 0.6823, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||:  99%|#########9| 110/111 [01:18<00:00,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9495, LAS: 0.9060, UEM: 0.5958, LEM: 0.3663, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5263, partial_loss/deprel_loss: 0.5980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7558, loss: 0.6830, batch_reg_loss: 0.1721, reg_loss: 0.1722 ||: 100%|##########| 111/111 [01:18<00:00,  1.41it/s]\n",
      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:40:37,035 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.598  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.526  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - UEM                      |     0.596  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - LAS                      |     0.906  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - loss                     |     0.683  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - LEM                      |     0.366  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - EM                       |     0.895  |       N/A\n",
      "2023-04-07 00:40:37,036 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:40:37,041 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:40:41,884 - INFO - combo.training.trainer - Epoch duration: 0:01:27.026083\n",
      "2023-04-07 00:40:41,884 - INFO - combo.training.trainer - Estimated training time remaining: 7:10:06\n",
      "2023-04-07 00:40:41,885 - INFO - allennlp.training.trainer - Epoch 82/399\n",
      "2023-04-07 00:40:41,885 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:40:41,885 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:40:41,894 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9409, LAS: 0.8998, UEM: 0.4771, LEM: 0.2604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0136, partial_loss/deprel_loss: 0.6579, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9012, loss: 0.7123, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:   4%|3         | 4/111 [00:02<01:10,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9483, LAS: 0.9083, UEM: 0.6919, LEM: 0.5363, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5977, partial_loss/deprel_loss: 0.5405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7241, loss: 0.6607, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:   6%|6         | 7/111 [00:05<01:14,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9542, LAS: 0.9138, UEM: 0.7011, LEM: 0.4979, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6391, partial_loss/deprel_loss: 0.5094, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7074, loss: 0.6194, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  10%|9         | 11/111 [00:07<01:08,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9534, LAS: 0.9131, UEM: 0.6858, LEM: 0.4754, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4420, partial_loss/deprel_loss: 0.4731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.6224, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  13%|#2        | 14/111 [00:09<01:05,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8861, UAS: 0.9539, LAS: 0.9126, UEM: 0.6711, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6797, partial_loss/deprel_loss: 0.6238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8071, loss: 0.6269, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  16%|#6        | 18/111 [00:12<01:01,  1.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9545, LAS: 0.9128, UEM: 0.6608, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3726, partial_loss/deprel_loss: 0.5161, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6595, loss: 0.6252, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  19%|#8        | 21/111 [00:14<01:00,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9565, LAS: 0.9145, UEM: 0.6808, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4160, partial_loss/deprel_loss: 0.5045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6589, loss: 0.6114, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  22%|##1       | 24/111 [00:16<01:01,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9542, LAS: 0.9119, UEM: 0.6572, LEM: 0.4251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6785, partial_loss/deprel_loss: 0.6107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7963, loss: 0.6330, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  24%|##4       | 27/111 [00:18<00:58,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9553, LAS: 0.9132, UEM: 0.6573, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2071, partial_loss/deprel_loss: 0.3437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4885, loss: 0.6242, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  28%|##7       | 31/111 [00:21<00:56,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8581, UAS: 0.9533, LAS: 0.9109, UEM: 0.6456, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1913, partial_loss/deprel_loss: 0.8398, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0822, loss: 0.6427, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  31%|###       | 34/111 [00:23<00:53,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9520, LAS: 0.9095, UEM: 0.6338, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0930, partial_loss/deprel_loss: 0.6926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9448, loss: 0.6531, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  33%|###3      | 37/111 [00:25<00:52,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9523, LAS: 0.9097, UEM: 0.6358, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1727, partial_loss/deprel_loss: 0.3159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4593, loss: 0.6540, batch_reg_loss: 0.1721, reg_loss: 0.1721 ||:  37%|###6      | 41/111 [00:28<00:48,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9517, LAS: 0.9092, UEM: 0.6257, LEM: 0.3878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2168, partial_loss/deprel_loss: 0.3799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5193, loss: 0.6588, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  41%|####      | 45/111 [00:30<00:42,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9085, UAS: 0.9508, LAS: 0.9081, UEM: 0.6245, LEM: 0.3829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4910, partial_loss/deprel_loss: 0.5458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7069, loss: 0.6681, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  44%|####4     | 49/111 [00:33<00:40,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9501, LAS: 0.9071, UEM: 0.6120, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8077, partial_loss/deprel_loss: 0.6382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8442, loss: 0.6766, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  48%|####7     | 53/111 [00:35<00:39,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9225, UAS: 0.9507, LAS: 0.9076, UEM: 0.6135, LEM: 0.3716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2720, partial_loss/deprel_loss: 0.4549, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5904, loss: 0.6743, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  50%|#####     | 56/111 [00:38<00:38,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9502, LAS: 0.9071, UEM: 0.5999, LEM: 0.3610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6217, partial_loss/deprel_loss: 0.5910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7692, loss: 0.6763, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  54%|#####4    | 60/111 [00:40<00:34,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9502, LAS: 0.9069, UEM: 0.5913, LEM: 0.3521, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5812, partial_loss/deprel_loss: 0.5780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7507, loss: 0.6767, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9309, UAS: 0.9498, LAS: 0.9065, UEM: 0.5906, LEM: 0.3518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2432, partial_loss/deprel_loss: 0.3638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5117, loss: 0.6800, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  60%|######    | 67/111 [00:46<00:32,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9500, LAS: 0.9065, UEM: 0.5908, LEM: 0.3497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2326, partial_loss/deprel_loss: 0.4214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5557, loss: 0.6793, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  63%|######3   | 70/111 [00:48<00:30,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8726, UAS: 0.9501, LAS: 0.9067, UEM: 0.5942, LEM: 0.3538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9001, partial_loss/deprel_loss: 0.6856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9006, loss: 0.6772, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  66%|######5   | 73/111 [00:50<00:28,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9371, UAS: 0.9502, LAS: 0.9067, UEM: 0.5941, LEM: 0.3537, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1827, partial_loss/deprel_loss: 0.3380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4790, loss: 0.6774, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  68%|######8   | 76/111 [00:52<00:26,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9507, LAS: 0.9072, UEM: 0.6020, LEM: 0.3641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3602, partial_loss/deprel_loss: 0.5102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6522, loss: 0.6746, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  72%|#######2  | 80/111 [00:55<00:22,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8810, UAS: 0.9504, LAS: 0.9068, UEM: 0.5954, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7883, partial_loss/deprel_loss: 0.6437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8446, loss: 0.6771, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  75%|#######4  | 83/111 [00:57<00:19,  1.42it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9504, LAS: 0.9068, UEM: 0.5946, LEM: 0.3573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3513, partial_loss/deprel_loss: 0.4657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6149, loss: 0.6778, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  77%|#######7  | 86/111 [00:59<00:17,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9503, LAS: 0.9066, UEM: 0.5921, LEM: 0.3549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3417, partial_loss/deprel_loss: 0.4772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.6793, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  80%|########  | 89/111 [01:01<00:15,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8857, UAS: 0.9502, LAS: 0.9063, UEM: 0.5880, LEM: 0.3507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7008, partial_loss/deprel_loss: 0.5836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7791, loss: 0.6807, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  83%|########2 | 92/111 [01:03<00:13,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9504, LAS: 0.9067, UEM: 0.5963, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6970, partial_loss/deprel_loss: 0.5774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7733, loss: 0.6775, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  86%|########5 | 95/111 [01:06<00:11,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9136, UAS: 0.9498, LAS: 0.9059, UEM: 0.5917, LEM: 0.3550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3445, partial_loss/deprel_loss: 0.4310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5857, loss: 0.6827, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  89%|########9 | 99/111 [01:08<00:08,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9501, LAS: 0.9062, UEM: 0.5957, LEM: 0.3577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2567, partial_loss/deprel_loss: 0.4081, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5498, loss: 0.6808, batch_reg_loss: 0.1720, reg_loss: 0.1721 ||:  92%|#########1| 102/111 [01:10<00:06,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9501, LAS: 0.9062, UEM: 0.5980, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1534, partial_loss/deprel_loss: 0.2828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4289, loss: 0.6796, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:  95%|#########5| 106/111 [01:13<00:03,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9505, LAS: 0.9066, UEM: 0.6012, LEM: 0.3650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2708, partial_loss/deprel_loss: 0.3733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5247, loss: 0.6757, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:  98%|#########8| 109/111 [01:15<00:01,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9500, LAS: 0.9062, UEM: 0.5992, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3536, partial_loss/deprel_loss: 0.4593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6101, loss: 0.6789, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||: 100%|##########| 111/111 [01:17<00:00,  1.44it/s]\n",
      "2023-04-07 00:42:02,217 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.459  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.354  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - UEM                      |     0.599  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - LAS                      |     0.906  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - loss                     |     0.679  |       N/A\n",
      "2023-04-07 00:42:02,218 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - LEM                      |     0.363  |       N/A\n",
      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - EM                       |     0.915  |       N/A\n",
      "2023-04-07 00:42:02,219 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:42:02,224 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:42:07,283 - INFO - combo.training.trainer - Epoch duration: 0:01:25.398504\n",
      "2023-04-07 00:42:07,284 - INFO - combo.training.trainer - Estimated training time remaining: 7:09:01\n",
      "2023-04-07 00:42:07,284 - INFO - allennlp.training.trainer - Epoch 83/399\n",
      "2023-04-07 00:42:07,284 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:42:07,285 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:42:07,294 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8909, UAS: 0.9284, LAS: 0.8837, UEM: 0.1775, LEM: 0.0476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6096, partial_loss/deprel_loss: 0.6407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8064, loss: 0.8763, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:   3%|2         | 3/111 [00:02<01:18,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9434, LAS: 0.8991, UEM: 0.5232, LEM: 0.2785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2584, partial_loss/deprel_loss: 0.4491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5829, loss: 0.7464, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:   5%|5         | 6/111 [00:04<01:14,  1.40it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9472, LAS: 0.9040, UEM: 0.5188, LEM: 0.2745, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3754, partial_loss/deprel_loss: 0.4332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5936, loss: 0.7046, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:   9%|9         | 10/111 [00:06<01:09,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9509, LAS: 0.9083, UEM: 0.5943, LEM: 0.3498, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7866, partial_loss/deprel_loss: 0.5632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7799, loss: 0.6678, batch_reg_loss: 0.1720, reg_loss: 0.1720 ||:  13%|#2        | 14/111 [00:09<01:03,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9491, LAS: 0.9066, UEM: 0.5690, LEM: 0.3295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4959, partial_loss/deprel_loss: 0.5747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7309, loss: 0.6766, batch_reg_loss: 0.1719, reg_loss: 0.1720 ||:  15%|#5        | 17/111 [00:11<01:04,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8928, UAS: 0.9483, LAS: 0.9054, UEM: 0.5519, LEM: 0.3169, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7224, partial_loss/deprel_loss: 0.6577, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8426, loss: 0.6896, batch_reg_loss: 0.1719, reg_loss: 0.1720 ||:  19%|#8        | 21/111 [00:13<00:58,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8593, UAS: 0.9476, LAS: 0.9052, UEM: 0.5393, LEM: 0.3055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3746, partial_loss/deprel_loss: 0.7047, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0106, loss: 0.6951, batch_reg_loss: 0.1719, reg_loss: 0.1720 ||:  23%|##3       | 26/111 [00:15<00:50,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9492, LAS: 0.9067, UEM: 0.6104, LEM: 0.3823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2221, partial_loss/deprel_loss: 0.3582, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5029, loss: 0.6811, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  27%|##7       | 30/111 [00:18<00:47,  1.69it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9487, LAS: 0.9066, UEM: 0.5992, LEM: 0.3710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9904, partial_loss/deprel_loss: 0.5820, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8356, loss: 0.6787, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  31%|###       | 34/111 [00:20<00:46,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9484, LAS: 0.9060, UEM: 0.5845, LEM: 0.3575, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7106, partial_loss/deprel_loss: 0.6451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8301, loss: 0.6820, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  34%|###4      | 38/111 [00:23<00:43,  1.69it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9472, LAS: 0.9040, UEM: 0.5775, LEM: 0.3495, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2128, partial_loss/deprel_loss: 0.3823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.6965, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  38%|###7      | 42/111 [00:25<00:42,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8944, UAS: 0.9459, LAS: 0.9025, UEM: 0.5688, LEM: 0.3394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5569, partial_loss/deprel_loss: 0.5899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7552, loss: 0.7069, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  41%|####1     | 46/111 [00:28<00:42,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9474, LAS: 0.9046, UEM: 0.6034, LEM: 0.3864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2728, partial_loss/deprel_loss: 0.3495, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5061, loss: 0.6915, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  45%|####5     | 50/111 [00:31<00:42,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9489, LAS: 0.9062, UEM: 0.6256, LEM: 0.4053, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1323, partial_loss/deprel_loss: 0.2757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4189, loss: 0.6783, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  48%|####7     | 53/111 [00:34<00:42,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9494, LAS: 0.9068, UEM: 0.6231, LEM: 0.4025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3449, partial_loss/deprel_loss: 0.4298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.6730, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  51%|#####1    | 57/111 [00:36<00:37,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9124, UAS: 0.9496, LAS: 0.9068, UEM: 0.6177, LEM: 0.3945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4062, partial_loss/deprel_loss: 0.4269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5946, loss: 0.6716, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  55%|#####4    | 61/111 [00:39<00:34,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9496, LAS: 0.9068, UEM: 0.6141, LEM: 0.3893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3288, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5248, loss: 0.6721, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  58%|#####7    | 64/111 [00:41<00:32,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9241, UAS: 0.9504, LAS: 0.9075, UEM: 0.6194, LEM: 0.3902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2091, partial_loss/deprel_loss: 0.3767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5151, loss: 0.6667, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  60%|######    | 67/111 [00:44<00:33,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9505, LAS: 0.9076, UEM: 0.6181, LEM: 0.3875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4662, partial_loss/deprel_loss: 0.4629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6354, loss: 0.6657, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  63%|######3   | 70/111 [00:46<00:30,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8761, UAS: 0.9504, LAS: 0.9074, UEM: 0.6133, LEM: 0.3826, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7722, partial_loss/deprel_loss: 0.6533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8489, loss: 0.6670, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  66%|######5   | 73/111 [00:48<00:28,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9505, LAS: 0.9074, UEM: 0.6114, LEM: 0.3800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9190, partial_loss/deprel_loss: 0.6907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9083, loss: 0.6686, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  68%|######8   | 76/111 [00:50<00:25,  1.35it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9506, LAS: 0.9075, UEM: 0.6083, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2458, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5082, loss: 0.6687, batch_reg_loss: 0.1719, reg_loss: 0.1719 ||:  72%|#######2  | 80/111 [00:53<00:22,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9507, LAS: 0.9076, UEM: 0.6118, LEM: 0.3788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1026, partial_loss/deprel_loss: 0.2484, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3911, loss: 0.6690, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  76%|#######5  | 84/111 [00:56<00:18,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8797, UAS: 0.9502, LAS: 0.9070, UEM: 0.6113, LEM: 0.3799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7965, partial_loss/deprel_loss: 0.6126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8212, loss: 0.6721, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  78%|#######8  | 87/111 [00:58<00:16,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9498, LAS: 0.9066, UEM: 0.6044, LEM: 0.3737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6229, partial_loss/deprel_loss: 0.5504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7368, loss: 0.6750, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  81%|########1 | 90/111 [01:00<00:14,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9495, LAS: 0.9063, UEM: 0.6002, LEM: 0.3700, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6756, partial_loss/deprel_loss: 0.6268, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8084, loss: 0.6786, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  84%|########3 | 93/111 [01:02<00:12,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9491, LAS: 0.9058, UEM: 0.5947, LEM: 0.3652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3796, partial_loss/deprel_loss: 0.4655, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6201, loss: 0.6819, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  86%|########6 | 96/111 [01:04<00:10,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9492, LAS: 0.9059, UEM: 0.5928, LEM: 0.3622, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2853, partial_loss/deprel_loss: 0.4503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5891, loss: 0.6819, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  90%|######### | 100/111 [01:06<00:07,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9496, LAS: 0.9062, UEM: 0.5967, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1409, partial_loss/deprel_loss: 0.3100, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4481, loss: 0.6789, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  94%|#########3| 104/111 [01:09<00:04,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9499, LAS: 0.9066, UEM: 0.6023, LEM: 0.3686, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1972, partial_loss/deprel_loss: 0.3334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.6747, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||:  97%|#########7| 108/111 [01:12<00:02,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9498, LAS: 0.9063, UEM: 0.5988, LEM: 0.3643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4659, partial_loss/deprel_loss: 0.5357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6935, loss: 0.6770, batch_reg_loss: 0.1718, reg_loss: 0.1719 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
      "2023-04-07 00:43:24,069 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.536  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.466  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - UEM                      |     0.599  |       N/A\n",
      "2023-04-07 00:43:24,070 - INFO - combo.training.tensorboard_writer - LAS                      |     0.906  |       N/A\n",
      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - loss                     |     0.677  |       N/A\n",
      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - LEM                      |     0.364  |       N/A\n",
      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - EM                       |     0.896  |       N/A\n",
      "2023-04-07 00:43:24,071 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:43:24,076 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:43:28,783 - INFO - combo.training.trainer - Epoch duration: 0:01:21.499439\n",
      "2023-04-07 00:43:28,783 - INFO - combo.training.trainer - Estimated training time remaining: 7:07:41\n",
      "2023-04-07 00:43:28,784 - INFO - allennlp.training.trainer - Epoch 84/399\n",
      "2023-04-07 00:43:28,784 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:43:28,784 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:43:28,790 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9514, LAS: 0.9079, UEM: 0.4796, LEM: 0.2044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2878, partial_loss/deprel_loss: 0.4113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5584, loss: 0.6576, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:   5%|4         | 5/111 [00:02<00:45,  2.32it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9469, LAS: 0.9044, UEM: 0.4177, LEM: 0.1680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4348, partial_loss/deprel_loss: 0.4723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6366, loss: 0.6858, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:   9%|9         | 10/111 [00:04<00:44,  2.25it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8954, UAS: 0.9428, LAS: 0.9011, UEM: 0.4024, LEM: 0.1678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6157, partial_loss/deprel_loss: 0.6063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.7110, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  14%|#3        | 15/111 [00:06<00:43,  2.23it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8660, UAS: 0.9426, LAS: 0.9007, UEM: 0.4122, LEM: 0.1725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1330, partial_loss/deprel_loss: 0.7580, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0048, loss: 0.7214, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  16%|#6        | 18/111 [00:08<00:49,  1.89it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9024, UAS: 0.9414, LAS: 0.8983, UEM: 0.3904, LEM: 0.1592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5205, partial_loss/deprel_loss: 0.5271, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6976, loss: 0.7382, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  19%|#8        | 21/111 [00:11<00:53,  1.69it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9161, UAS: 0.9424, LAS: 0.8993, UEM: 0.4119, LEM: 0.1776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3382, partial_loss/deprel_loss: 0.4379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5897, loss: 0.7295, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  22%|##1       | 24/111 [00:13<00:54,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9434, LAS: 0.9004, UEM: 0.4380, LEM: 0.2060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4872, partial_loss/deprel_loss: 0.5513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7103, loss: 0.7223, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  24%|##4       | 27/111 [00:15<00:55,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9455, LAS: 0.9026, UEM: 0.4731, LEM: 0.2309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2584, partial_loss/deprel_loss: 0.3982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5420, loss: 0.7058, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  27%|##7       | 30/111 [00:17<00:53,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9473, LAS: 0.9042, UEM: 0.5138, LEM: 0.2729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1126, partial_loss/deprel_loss: 0.2701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4104, loss: 0.6924, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  31%|###       | 34/111 [00:20<00:52,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9434, LAS: 0.9001, UEM: 0.4985, LEM: 0.2645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8823, partial_loss/deprel_loss: 0.6641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8795, loss: 0.7238, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  33%|###3      | 37/111 [00:22<00:51,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9439, LAS: 0.9003, UEM: 0.4910, LEM: 0.2574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5793, partial_loss/deprel_loss: 0.5165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7008, loss: 0.7221, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  36%|###6      | 40/111 [00:24<00:49,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9448, LAS: 0.9013, UEM: 0.4970, LEM: 0.2601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2447, partial_loss/deprel_loss: 0.4143, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5522, loss: 0.7138, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  39%|###8      | 43/111 [00:26<00:46,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9465, LAS: 0.9034, UEM: 0.5256, LEM: 0.2854, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2238, partial_loss/deprel_loss: 0.3439, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4916, loss: 0.6992, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  41%|####1     | 46/111 [00:28<00:45,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9223, UAS: 0.9458, LAS: 0.9026, UEM: 0.5203, LEM: 0.2823, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2626, partial_loss/deprel_loss: 0.3949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5402, loss: 0.7034, batch_reg_loss: 0.1718, reg_loss: 0.1718 ||:  44%|####4     | 49/111 [00:31<00:43,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9146, UAS: 0.9466, LAS: 0.9034, UEM: 0.5216, LEM: 0.2819, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3617, partial_loss/deprel_loss: 0.4681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6186, loss: 0.6996, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  47%|####6     | 52/111 [00:33<00:41,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9474, LAS: 0.9043, UEM: 0.5501, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1540, partial_loss/deprel_loss: 0.3062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4475, loss: 0.6910, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  50%|#####     | 56/111 [00:35<00:37,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8563, UAS: 0.9467, LAS: 0.9035, UEM: 0.5399, LEM: 0.3035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1279, partial_loss/deprel_loss: 0.7786, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0202, loss: 0.6955, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  54%|#####4    | 60/111 [00:38<00:33,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9474, LAS: 0.9045, UEM: 0.5443, LEM: 0.3067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1799, partial_loss/deprel_loss: 0.3411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4806, loss: 0.6883, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  58%|#####7    | 64/111 [00:40<00:30,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8833, UAS: 0.9474, LAS: 0.9044, UEM: 0.5436, LEM: 0.3061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7734, partial_loss/deprel_loss: 0.7165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8995, loss: 0.6890, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  61%|######1   | 68/111 [00:43<00:27,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9484, LAS: 0.9054, UEM: 0.5534, LEM: 0.3129, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.4111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5501, loss: 0.6814, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  65%|######4   | 72/111 [00:46<00:26,  1.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9485, LAS: 0.9056, UEM: 0.5534, LEM: 0.3148, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6119, partial_loss/deprel_loss: 0.5648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7459, loss: 0.6804, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  68%|######7   | 75/111 [00:48<00:25,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9488, LAS: 0.9060, UEM: 0.5591, LEM: 0.3222, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2361, partial_loss/deprel_loss: 0.2912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4519, loss: 0.6775, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  70%|#######   | 78/111 [00:51<00:25,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9484, UAS: 0.9494, LAS: 0.9067, UEM: 0.5780, LEM: 0.3444, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0818, partial_loss/deprel_loss: 0.2043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3515, loss: 0.6721, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  73%|#######2  | 81/111 [00:53<00:22,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8720, UAS: 0.9490, LAS: 0.9061, UEM: 0.5733, LEM: 0.3404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9083, partial_loss/deprel_loss: 0.6554, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8776, loss: 0.6770, batch_reg_loss: 0.1717, reg_loss: 0.1718 ||:  77%|#######6  | 85/111 [00:56<00:18,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9488, LAS: 0.9059, UEM: 0.5730, LEM: 0.3413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1963, partial_loss/deprel_loss: 0.3102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4591, loss: 0.6784, batch_reg_loss: 0.1717, reg_loss: 0.1717 ||:  80%|########  | 89/111 [00:58<00:15,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9676, UAS: 0.9493, LAS: 0.9065, UEM: 0.5893, LEM: 0.3645, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0396, partial_loss/deprel_loss: 0.1135, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2704, loss: 0.6757, batch_reg_loss: 0.1717, reg_loss: 0.1717 ||:  83%|########2 | 92/111 [01:01<00:14,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9494, LAS: 0.9066, UEM: 0.5906, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8848, partial_loss/deprel_loss: 0.7517, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9500, loss: 0.6758, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||:  86%|########5 | 95/111 [01:03<00:11,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9497, LAS: 0.9070, UEM: 0.5945, LEM: 0.3684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6637, partial_loss/deprel_loss: 0.6962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8613, loss: 0.6744, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||:  88%|########8 | 98/111 [01:05<00:09,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8481, UAS: 0.9495, LAS: 0.9067, UEM: 0.5956, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2025, partial_loss/deprel_loss: 0.8264, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0732, loss: 0.6749, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||:  92%|#########1| 102/111 [01:08<00:06,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9498, LAS: 0.9069, UEM: 0.5952, LEM: 0.3670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2573, partial_loss/deprel_loss: 0.4458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.6735, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||:  95%|#########4| 105/111 [01:10<00:04,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9137, UAS: 0.9498, LAS: 0.9069, UEM: 0.5966, LEM: 0.3667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2900, partial_loss/deprel_loss: 0.4007, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5502, loss: 0.6728, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||:  98%|#########8| 109/111 [01:13<00:01,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9500, LAS: 0.9070, UEM: 0.6010, LEM: 0.3704, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0986, partial_loss/deprel_loss: 0.3075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4373, loss: 0.6715, batch_reg_loss: 0.1716, reg_loss: 0.1717 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
      "2023-04-07 00:44:46,230 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:44:46,230 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:44:46,230 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:44:46,230 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.307  |       N/A\n",
      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.099  |       N/A\n",
      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |       N/A\n",
      "2023-04-07 00:44:46,231 - INFO - combo.training.tensorboard_writer - UEM                      |     0.601  |       N/A\n",
      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - LAS                      |     0.907  |       N/A\n",
      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - loss                     |     0.671  |       N/A\n",
      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - LEM                      |     0.370  |       N/A\n",
      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
      "2023-04-07 00:44:46,232 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:44:46,233 - INFO - combo.training.tensorboard_writer - EM                       |     0.935  |       N/A\n",
      "2023-04-07 00:44:46,233 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:44:46,238 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:44:52,274 - INFO - combo.training.trainer - Epoch duration: 0:01:23.490118\n",
      "2023-04-07 00:44:52,274 - INFO - combo.training.trainer - Estimated training time remaining: 7:06:28\n",
      "2023-04-07 00:44:52,274 - INFO - allennlp.training.trainer - Epoch 85/399\n",
      "2023-04-07 00:44:52,274 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:44:52,275 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:44:52,284 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9022, UAS: 0.9489, LAS: 0.9040, UEM: 0.4945, LEM: 0.2749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4882, partial_loss/deprel_loss: 0.5869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7388, loss: 0.6966, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:   4%|3         | 4/111 [00:02<00:59,  1.80it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8816, UAS: 0.9493, LAS: 0.9031, UEM: 0.4720, LEM: 0.2297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8211, partial_loss/deprel_loss: 0.6876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8859, loss: 0.7048, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:   7%|7         | 8/111 [00:04<00:59,  1.74it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8923, UAS: 0.9508, LAS: 0.9050, UEM: 0.5020, LEM: 0.2539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5759, partial_loss/deprel_loss: 0.5518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7282, loss: 0.6806, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  10%|9         | 11/111 [00:07<01:03,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9533, LAS: 0.9086, UEM: 0.5372, LEM: 0.2891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2173, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5025, loss: 0.6507, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  14%|#3        | 15/111 [00:09<01:01,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9512, LAS: 0.9070, UEM: 0.5409, LEM: 0.2963, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.6631, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  16%|#6        | 18/111 [00:12<01:05,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9511, LAS: 0.9074, UEM: 0.5449, LEM: 0.3035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2308, partial_loss/deprel_loss: 0.3370, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4873, loss: 0.6610, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  19%|#8        | 21/111 [00:14<01:03,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9543, LAS: 0.9116, UEM: 0.6365, LEM: 0.4128, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2214, partial_loss/deprel_loss: 0.4003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5361, loss: 0.6342, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  22%|##1       | 24/111 [00:16<01:03,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9527, LAS: 0.9099, UEM: 0.6114, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3740, partial_loss/deprel_loss: 0.4229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.6472, batch_reg_loss: 0.1716, reg_loss: 0.1716 ||:  25%|##5       | 28/111 [00:19<00:58,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9535, LAS: 0.9106, UEM: 0.6154, LEM: 0.3871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1930, partial_loss/deprel_loss: 0.3449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4861, loss: 0.6429, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  28%|##7       | 31/111 [00:21<00:55,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9547, LAS: 0.9122, UEM: 0.6263, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3075, partial_loss/deprel_loss: 0.4177, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5672, loss: 0.6327, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  31%|###       | 34/111 [00:23<00:53,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8845, UAS: 0.9544, LAS: 0.9119, UEM: 0.6212, LEM: 0.3862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6734, partial_loss/deprel_loss: 0.6002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7864, loss: 0.6345, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  34%|###4      | 38/111 [00:25<00:48,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9535, LAS: 0.9111, UEM: 0.6093, LEM: 0.3757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6099, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7056, loss: 0.6401, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  37%|###6      | 41/111 [00:27<00:47,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9540, LAS: 0.9116, UEM: 0.6067, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3456, partial_loss/deprel_loss: 0.5257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6612, loss: 0.6379, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  41%|####      | 45/111 [00:30<00:43,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9532, LAS: 0.9111, UEM: 0.5997, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7733, partial_loss/deprel_loss: 0.6122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8159, loss: 0.6409, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  44%|####4     | 49/111 [00:32<00:40,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9513, LAS: 0.9092, UEM: 0.5832, LEM: 0.3510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6072, partial_loss/deprel_loss: 0.5884, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7637, loss: 0.6533, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  48%|####7     | 53/111 [00:35<00:39,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8929, UAS: 0.9512, LAS: 0.9091, UEM: 0.5850, LEM: 0.3532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6603, partial_loss/deprel_loss: 0.6363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8126, loss: 0.6534, batch_reg_loss: 0.1715, reg_loss: 0.1716 ||:  50%|#####     | 56/111 [00:38<00:38,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9517, LAS: 0.9096, UEM: 0.5943, LEM: 0.3615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1501, partial_loss/deprel_loss: 0.2723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.6495, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  54%|#####4    | 60/111 [00:40<00:34,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9081, UAS: 0.9500, LAS: 0.9079, UEM: 0.5866, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4817, partial_loss/deprel_loss: 0.5117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6772, loss: 0.6611, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  58%|#####7    | 64/111 [00:43<00:31,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8893, UAS: 0.9503, LAS: 0.9082, UEM: 0.5875, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6555, partial_loss/deprel_loss: 0.6512, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8236, loss: 0.6617, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  61%|######1   | 68/111 [00:46<00:30,  1.42it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8993, UAS: 0.9508, LAS: 0.9088, UEM: 0.5997, LEM: 0.3701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5530, partial_loss/deprel_loss: 0.4983, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6807, loss: 0.6568, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  64%|######3   | 71/111 [00:48<00:28,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8860, UAS: 0.9502, LAS: 0.9081, UEM: 0.5917, LEM: 0.3636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7786, partial_loss/deprel_loss: 0.6569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8527, loss: 0.6633, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  67%|######6   | 74/111 [00:50<00:26,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9503, LAS: 0.9081, UEM: 0.5887, LEM: 0.3580, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5200, partial_loss/deprel_loss: 0.5049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6793, loss: 0.6635, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  69%|######9   | 77/111 [00:52<00:23,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9168, UAS: 0.9494, LAS: 0.9071, UEM: 0.5841, LEM: 0.3539, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3174, partial_loss/deprel_loss: 0.4077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5611, loss: 0.6703, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  72%|#######2  | 80/111 [00:54<00:21,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9502, LAS: 0.9081, UEM: 0.6033, LEM: 0.3762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2790, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5367, loss: 0.6625, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  75%|#######4  | 83/111 [00:57<00:20,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9505, LAS: 0.9084, UEM: 0.6038, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2464, partial_loss/deprel_loss: 0.3908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5334, loss: 0.6609, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  77%|#######7  | 86/111 [00:59<00:18,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8735, UAS: 0.9498, LAS: 0.9076, UEM: 0.5981, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9836, partial_loss/deprel_loss: 0.6747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9079, loss: 0.6671, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  81%|########1 | 90/111 [01:01<00:14,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8866, UAS: 0.9492, LAS: 0.9069, UEM: 0.5945, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7101, partial_loss/deprel_loss: 0.6880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8639, loss: 0.6734, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  85%|########4 | 94/111 [01:04<00:11,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8769, UAS: 0.9493, LAS: 0.9069, UEM: 0.5976, LEM: 0.3690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9722, partial_loss/deprel_loss: 0.6962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9228, loss: 0.6741, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  87%|########7 | 97/111 [01:06<00:09,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8829, UAS: 0.9496, LAS: 0.9071, UEM: 0.5950, LEM: 0.3648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7420, partial_loss/deprel_loss: 0.7137, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8908, loss: 0.6729, batch_reg_loss: 0.1715, reg_loss: 0.1715 ||:  92%|#########1| 102/111 [01:08<00:05,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9499, LAS: 0.9075, UEM: 0.5979, LEM: 0.3685, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5373, partial_loss/deprel_loss: 0.5125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6889, loss: 0.6693, batch_reg_loss: 0.1714, reg_loss: 0.1715 ||:  96%|#########6| 107/111 [01:11<00:02,  1.73it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9504, LAS: 0.9079, UEM: 0.6026, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2185, partial_loss/deprel_loss: 0.3660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5080, loss: 0.6663, batch_reg_loss: 0.1714, reg_loss: 0.1715 ||: 100%|##########| 111/111 [01:13<00:00,  1.52it/s]\n",
      "2023-04-07 00:46:08,660 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9122, LAS: 0.8613, UEM: 0.3719, LEM: 0.1357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6872, partial_loss/deprel_loss: 33.7202, partial_loss/cycle_loss: 0.0000, batch_loss: 27.1136, loss: 36.1110, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.03s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8709, UAS: 0.9236, LAS: 0.8697, UEM: 0.3147, LEM: 0.0932, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3113, partial_loss/deprel_loss: 47.1769, partial_loss/cycle_loss: 0.0000, batch_loss: 38.0038, loss: 32.5457, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:08,  1.01s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9373, LAS: 0.8872, UEM: 0.6018, LEM: 0.3907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1716, partial_loss/deprel_loss: 19.2356, partial_loss/cycle_loss: 0.0000, batch_loss: 15.4228, loss: 28.2524, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:05,  1.00s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9431, LAS: 0.8932, UEM: 0.6361, LEM: 0.3959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1653, partial_loss/deprel_loss: 23.1310, partial_loss/cycle_loss: 0.0000, batch_loss: 18.5378, loss: 26.2134, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9160, UAS: 0.9460, LAS: 0.8958, UEM: 0.6466, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3953, partial_loss/deprel_loss: 25.8727, partial_loss/cycle_loss: 0.0000, batch_loss: 20.7773, loss: 25.2483, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.01it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9160, UAS: 0.9460, LAS: 0.8958, UEM: 0.6466, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3953, partial_loss/deprel_loss: 25.8727, partial_loss/cycle_loss: 0.0000, batch_loss: 20.7773, loss: 25.2483, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.366  |    25.873\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.218  |     0.395\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.172  |     0.000\n",
      "2023-04-07 00:46:21,312 - INFO - combo.training.tensorboard_writer - UEM                      |     0.603  |     0.647\n",
      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - LAS                      |     0.908  |     0.896\n",
      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - loss                     |     0.666  |    25.248\n",
      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - LEM                      |     0.371  |     0.386\n",
      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |     0.946\n",
      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - EM                       |     0.927  |     0.916\n",
      "2023-04-07 00:46:21,313 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:46:21,318 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:46:26,252 - INFO - combo.training.trainer - Epoch duration: 0:01:33.977591\n",
      "2023-04-07 00:46:26,252 - INFO - combo.training.trainer - Estimated training time remaining: 7:05:54\n",
      "2023-04-07 00:46:26,252 - INFO - allennlp.training.trainer - Epoch 86/399\n",
      "2023-04-07 00:46:26,252 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:46:26,253 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:46:26,259 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8962, UAS: 0.9549, LAS: 0.9143, UEM: 0.5126, LEM: 0.2644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5999, partial_loss/deprel_loss: 0.5818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7569, loss: 0.6319, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:   4%|3         | 4/111 [00:02<01:11,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9574, LAS: 0.9172, UEM: 0.5572, LEM: 0.2986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2609, partial_loss/deprel_loss: 0.3570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5092, loss: 0.6052, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:   6%|6         | 7/111 [00:04<01:09,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9556, LAS: 0.9147, UEM: 0.5295, LEM: 0.2703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3098, partial_loss/deprel_loss: 0.4638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.6292, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:   9%|9         | 10/111 [00:06<01:08,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9560, LAS: 0.9151, UEM: 0.5308, LEM: 0.2715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4331, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5955, loss: 0.6216, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  12%|#1        | 13/111 [00:08<01:07,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9553, LAS: 0.9142, UEM: 0.5352, LEM: 0.2763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3347, partial_loss/deprel_loss: 0.4334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 0.6263, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  15%|#5        | 17/111 [00:11<01:03,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9548, LAS: 0.9133, UEM: 0.5388, LEM: 0.2755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2227, partial_loss/deprel_loss: 0.3917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5293, loss: 0.6341, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  18%|#8        | 20/111 [00:13<01:02,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9508, LAS: 0.9089, UEM: 0.5216, LEM: 0.2667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4718, partial_loss/deprel_loss: 0.5207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6823, loss: 0.6611, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  22%|##1       | 24/111 [00:15<00:56,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9503, LAS: 0.9078, UEM: 0.5263, LEM: 0.2784, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1759, partial_loss/deprel_loss: 0.3242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4659, loss: 0.6687, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  24%|##4       | 27/111 [00:18<00:58,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9507, LAS: 0.9085, UEM: 0.5438, LEM: 0.3015, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2016, partial_loss/deprel_loss: 0.2894, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4432, loss: 0.6630, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  28%|##7       | 31/111 [00:20<00:53,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9025, UAS: 0.9506, LAS: 0.9088, UEM: 0.5685, LEM: 0.3411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6470, partial_loss/deprel_loss: 0.5150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7128, loss: 0.6591, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  31%|###       | 34/111 [00:22<00:52,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9505, LAS: 0.9085, UEM: 0.5655, LEM: 0.3368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2677, partial_loss/deprel_loss: 0.4214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5621, loss: 0.6591, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  34%|###4      | 38/111 [00:25<00:49,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9513, LAS: 0.9093, UEM: 0.5822, LEM: 0.3554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1440, partial_loss/deprel_loss: 0.2598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4080, loss: 0.6536, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  37%|###6      | 41/111 [00:27<00:48,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9521, LAS: 0.9097, UEM: 0.5914, LEM: 0.3558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2431, partial_loss/deprel_loss: 0.4478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5782, loss: 0.6479, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  40%|###9      | 44/111 [00:30<00:48,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9506, LAS: 0.9082, UEM: 0.5772, LEM: 0.3460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0487, partial_loss/deprel_loss: 0.7064, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9462, loss: 0.6611, batch_reg_loss: 0.1714, reg_loss: 0.1714 ||:  42%|####2     | 47/111 [00:32<00:45,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9518, LAS: 0.9095, UEM: 0.5924, LEM: 0.3571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2587, partial_loss/deprel_loss: 0.4356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5716, loss: 0.6508, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  46%|####5     | 51/111 [00:34<00:42,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9527, LAS: 0.9100, UEM: 0.5966, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2301, partial_loss/deprel_loss: 0.3930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5318, loss: 0.6473, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  50%|####9     | 55/111 [00:37<00:39,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9522, LAS: 0.9094, UEM: 0.6012, LEM: 0.3618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1176, partial_loss/deprel_loss: 0.3189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.6513, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  53%|#####3    | 59/111 [00:40<00:35,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9524, LAS: 0.9098, UEM: 0.5956, LEM: 0.3554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4422, partial_loss/deprel_loss: 0.4964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6569, loss: 0.6495, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  57%|#####6    | 63/111 [00:42<00:31,  1.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9516, LAS: 0.9088, UEM: 0.5877, LEM: 0.3481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3114, partial_loss/deprel_loss: 0.4026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5557, loss: 0.6568, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  60%|######    | 67/111 [00:44<00:27,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8839, UAS: 0.9507, LAS: 0.9080, UEM: 0.5830, LEM: 0.3466, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8306, partial_loss/deprel_loss: 0.6379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8478, loss: 0.6621, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  65%|######4   | 72/111 [00:47<00:22,  1.71it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8612, UAS: 0.9501, LAS: 0.9074, UEM: 0.5871, LEM: 0.3530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1629, partial_loss/deprel_loss: 0.8042, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0473, loss: 0.6673, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  69%|######9   | 77/111 [00:49<00:18,  1.81it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9510, LAS: 0.9086, UEM: 0.6098, LEM: 0.3822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2064, partial_loss/deprel_loss: 0.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4838, loss: 0.6614, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  73%|#######2  | 81/111 [00:51<00:16,  1.80it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9511, LAS: 0.9085, UEM: 0.6124, LEM: 0.3836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3728, partial_loss/deprel_loss: 0.4867, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6352, loss: 0.6604, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  77%|#######6  | 85/111 [00:55<00:16,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8936, UAS: 0.9501, LAS: 0.9075, UEM: 0.6048, LEM: 0.3768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6928, partial_loss/deprel_loss: 0.6402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8220, loss: 0.6699, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  80%|########  | 89/111 [00:58<00:14,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9502, LAS: 0.9077, UEM: 0.6015, LEM: 0.3738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1512, partial_loss/deprel_loss: 0.3505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4820, loss: 0.6682, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  84%|########3 | 93/111 [01:00<00:12,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9506, LAS: 0.9082, UEM: 0.6050, LEM: 0.3765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2539, partial_loss/deprel_loss: 0.3479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5004, loss: 0.6638, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  87%|########7 | 97/111 [01:03<00:09,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8780, UAS: 0.9503, LAS: 0.9078, UEM: 0.5996, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8053, partial_loss/deprel_loss: 0.7396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9240, loss: 0.6678, batch_reg_loss: 0.1713, reg_loss: 0.1714 ||:  90%|######### | 100/111 [01:05<00:07,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9505, LAS: 0.9079, UEM: 0.6015, LEM: 0.3717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6447, partial_loss/deprel_loss: 0.5784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7629, loss: 0.6663, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:  94%|#########3| 104/111 [01:08<00:04,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8915, UAS: 0.9501, LAS: 0.9076, UEM: 0.5952, LEM: 0.3664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5785, partial_loss/deprel_loss: 0.6021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7687, loss: 0.6689, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:  97%|#########7| 108/111 [01:10<00:01,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9503, LAS: 0.9078, UEM: 0.6002, LEM: 0.3706, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5065, partial_loss/deprel_loss: 0.5337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6995, loss: 0.6659, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "2023-04-07 00:47:43,046 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.534  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.506  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - UEM                      |     0.600  |       N/A\n",
      "2023-04-07 00:47:43,047 - INFO - combo.training.tensorboard_writer - LAS                      |     0.908  |       N/A\n",
      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - loss                     |     0.666  |       N/A\n",
      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - LEM                      |     0.371  |       N/A\n",
      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - EM                       |     0.902  |       N/A\n",
      "2023-04-07 00:47:43,048 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:47:43,053 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:47:49,210 - INFO - combo.training.trainer - Epoch duration: 0:01:22.957862\n",
      "2023-04-07 00:47:49,211 - INFO - combo.training.trainer - Estimated training time remaining: 7:04:38\n",
      "2023-04-07 00:47:49,211 - INFO - allennlp.training.trainer - Epoch 87/399\n",
      "2023-04-07 00:47:49,211 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:47:49,212 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:47:49,221 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9687, LAS: 0.9283, UEM: 0.6917, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3433, partial_loss/deprel_loss: 0.4337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5869, loss: 0.5496, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9621, LAS: 0.9222, UEM: 0.7021, LEM: 0.4715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1045, partial_loss/deprel_loss: 0.2157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3647, loss: 0.5783, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:   5%|5         | 6/111 [00:04<01:18,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9557, LAS: 0.9144, UEM: 0.6255, LEM: 0.3980, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2458, partial_loss/deprel_loss: 0.3617, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5098, loss: 0.6403, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:   9%|9         | 10/111 [00:07<01:11,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9478, LAS: 0.9059, UEM: 0.5568, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8828, partial_loss/deprel_loss: 0.6399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8597, loss: 0.6974, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:  13%|#2        | 14/111 [00:09<01:07,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9500, LAS: 0.9077, UEM: 0.5914, LEM: 0.3698, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1040, partial_loss/deprel_loss: 0.3227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4502, loss: 0.6824, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:  15%|#5        | 17/111 [00:11<01:06,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9514, LAS: 0.9091, UEM: 0.6130, LEM: 0.3889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1171, partial_loss/deprel_loss: 0.2585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4015, loss: 0.6680, batch_reg_loss: 0.1713, reg_loss: 0.1713 ||:  18%|#8        | 20/111 [00:14<01:04,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8931, UAS: 0.9511, LAS: 0.9090, UEM: 0.5950, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7511, partial_loss/deprel_loss: 0.5584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7682, loss: 0.6676, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||:  21%|##        | 23/111 [00:16<01:01,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9521, LAS: 0.9100, UEM: 0.5844, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4836, partial_loss/deprel_loss: 0.5146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6796, loss: 0.6586, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||:  24%|##4       | 27/111 [00:18<00:55,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9511, LAS: 0.9096, UEM: 0.5885, LEM: 0.3636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3558, partial_loss/deprel_loss: 0.4047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5662, loss: 0.6604, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||:  28%|##7       | 31/111 [00:21<00:52,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8881, UAS: 0.9496, LAS: 0.9082, UEM: 0.5715, LEM: 0.3486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8574, partial_loss/deprel_loss: 0.6428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8570, loss: 0.6712, batch_reg_loss: 0.1712, reg_loss: 0.1713 ||:  32%|###1      | 35/111 [00:23<00:49,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9515, LAS: 0.9106, UEM: 0.5987, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2422, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4673, loss: 0.6518, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  35%|###5      | 39/111 [00:27<00:51,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8493, UAS: 0.9506, LAS: 0.9096, UEM: 0.5906, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2880, partial_loss/deprel_loss: 0.8245, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0884, loss: 0.6588, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  38%|###7      | 42/111 [00:29<00:49,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9517, LAS: 0.9103, UEM: 0.6028, LEM: 0.3697, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2292, partial_loss/deprel_loss: 0.4404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5693, loss: 0.6515, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  41%|####1     | 46/111 [00:31<00:42,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9519, LAS: 0.9103, UEM: 0.5993, LEM: 0.3624, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7766, partial_loss/deprel_loss: 0.5683, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7812, loss: 0.6519, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  46%|####5     | 51/111 [00:33<00:36,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9516, LAS: 0.9102, UEM: 0.6066, LEM: 0.3695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2039, partial_loss/deprel_loss: 0.2804, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4363, loss: 0.6525, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  50%|####9     | 55/111 [00:36<00:35,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8640, UAS: 0.9505, LAS: 0.9089, UEM: 0.5934, LEM: 0.3586, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0241, partial_loss/deprel_loss: 0.7608, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9846, loss: 0.6616, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  53%|#####3    | 59/111 [00:38<00:31,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9507, LAS: 0.9092, UEM: 0.6009, LEM: 0.3676, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2038, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4659, loss: 0.6563, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  57%|#####6    | 63/111 [00:41<00:29,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9497, LAS: 0.9081, UEM: 0.5987, LEM: 0.3649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2139, partial_loss/deprel_loss: 0.3651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5061, loss: 0.6632, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  60%|######    | 67/111 [00:43<00:27,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8482, UAS: 0.9490, LAS: 0.9072, UEM: 0.5947, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.4450, partial_loss/deprel_loss: 0.8776, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1623, loss: 0.6706, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  65%|######4   | 72/111 [00:46<00:23,  1.69it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9487, LAS: 0.9068, UEM: 0.5909, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2596, partial_loss/deprel_loss: 0.3874, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5330, loss: 0.6724, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  69%|######9   | 77/111 [00:48<00:18,  1.82it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9488, LAS: 0.9069, UEM: 0.5854, LEM: 0.3485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3230, partial_loss/deprel_loss: 0.4347, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5835, loss: 0.6719, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  73%|#######2  | 81/111 [00:51<00:17,  1.71it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9492, LAS: 0.9074, UEM: 0.6009, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7277, partial_loss/deprel_loss: 0.6733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8553, loss: 0.6688, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  77%|#######6  | 85/111 [00:54<00:16,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9496, LAS: 0.9078, UEM: 0.6041, LEM: 0.3746, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1636, partial_loss/deprel_loss: 0.2827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4300, loss: 0.6651, batch_reg_loss: 0.1712, reg_loss: 0.1712 ||:  80%|########  | 89/111 [00:57<00:14,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9493, LAS: 0.9073, UEM: 0.5980, LEM: 0.3695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4866, partial_loss/deprel_loss: 0.4848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6563, loss: 0.6681, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||:  84%|########3 | 93/111 [01:00<00:12,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9491, LAS: 0.9071, UEM: 0.5911, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3899, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6138, loss: 0.6705, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||:  87%|########7 | 97/111 [01:03<00:10,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9496, LAS: 0.9077, UEM: 0.5966, LEM: 0.3655, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3368, partial_loss/deprel_loss: 0.4039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5616, loss: 0.6659, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||:  91%|######### | 101/111 [01:05<00:06,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9502, LAS: 0.9085, UEM: 0.6076, LEM: 0.3781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3070, partial_loss/deprel_loss: 0.3840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5397, loss: 0.6596, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||:  95%|#########4| 105/111 [01:08<00:03,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9120, UAS: 0.9502, LAS: 0.9084, UEM: 0.6053, LEM: 0.3757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4180, partial_loss/deprel_loss: 0.4299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5986, loss: 0.6600, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||:  98%|#########8| 109/111 [01:11<00:01,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8934, UAS: 0.9501, LAS: 0.9082, UEM: 0.6015, LEM: 0.3723, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7131, partial_loss/deprel_loss: 0.6420, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8273, loss: 0.6628, batch_reg_loss: 0.1711, reg_loss: 0.1712 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
      "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:49:05,042 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.642  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.713  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - UEM                      |     0.601  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - LAS                      |     0.908  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - loss                     |     0.663  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - LEM                      |     0.372  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - EM                       |     0.893  |       N/A\n",
      "2023-04-07 00:49:05,043 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:49:05,048 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:49:10,018 - INFO - combo.training.trainer - Epoch duration: 0:01:20.806982\n",
      "2023-04-07 00:49:10,018 - INFO - combo.training.trainer - Estimated training time remaining: 7:03:15\n",
      "2023-04-07 00:49:10,018 - INFO - allennlp.training.trainer - Epoch 88/399\n",
      "2023-04-07 00:49:10,019 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:49:10,019 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:49:10,028 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9648, LAS: 0.9244, UEM: 0.6771, LEM: 0.4049, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3842, partial_loss/deprel_loss: 0.4413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6010, loss: 0.5365, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:   4%|3         | 4/111 [00:02<01:08,  1.56it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9613, LAS: 0.9201, UEM: 0.6885, LEM: 0.4540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1407, partial_loss/deprel_loss: 0.2453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3955, loss: 0.5656, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:   6%|6         | 7/111 [00:04<01:11,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8917, UAS: 0.9565, LAS: 0.9148, UEM: 0.6298, LEM: 0.3948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8094, partial_loss/deprel_loss: 0.6079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8192, loss: 0.6131, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  10%|9         | 11/111 [00:07<01:07,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9537, LAS: 0.9116, UEM: 0.6465, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4722, partial_loss/deprel_loss: 0.4675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6396, loss: 0.6314, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  13%|#2        | 14/111 [00:09<01:04,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9516, LAS: 0.9094, UEM: 0.6364, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2188, partial_loss/deprel_loss: 0.3068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4603, loss: 0.6542, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  16%|#6        | 18/111 [00:12<01:01,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9494, LAS: 0.9073, UEM: 0.6218, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7785, partial_loss/deprel_loss: 0.5826, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7928, loss: 0.6670, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  20%|#9        | 22/111 [00:14<00:58,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9493, LAS: 0.9074, UEM: 0.6181, LEM: 0.3962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6356, partial_loss/deprel_loss: 0.5565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7434, loss: 0.6665, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  23%|##2       | 25/111 [00:16<00:58,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9479, LAS: 0.9056, UEM: 0.5939, LEM: 0.3749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5422, partial_loss/deprel_loss: 0.5184, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6942, loss: 0.6767, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  25%|##5       | 28/111 [00:19<00:57,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9484, LAS: 0.9059, UEM: 0.6016, LEM: 0.3789, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1821, partial_loss/deprel_loss: 0.3461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4843, loss: 0.6760, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  28%|##7       | 31/111 [00:21<01:00,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8825, UAS: 0.9486, LAS: 0.9059, UEM: 0.5937, LEM: 0.3671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7760, partial_loss/deprel_loss: 0.5979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8046, loss: 0.6750, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  32%|###1      | 35/111 [00:24<00:54,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9470, LAS: 0.9040, UEM: 0.5709, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6367, partial_loss/deprel_loss: 0.6364, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8075, loss: 0.6898, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  35%|###5      | 39/111 [00:26<00:49,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9481, LAS: 0.9056, UEM: 0.5839, LEM: 0.3616, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1492, partial_loss/deprel_loss: 0.2564, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4060, loss: 0.6773, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  39%|###8      | 43/111 [00:29<00:47,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9492, LAS: 0.9066, UEM: 0.5935, LEM: 0.3658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2049, partial_loss/deprel_loss: 0.3325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.6670, batch_reg_loss: 0.1711, reg_loss: 0.1711 ||:  42%|####2     | 47/111 [00:31<00:42,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9481, LAS: 0.9053, UEM: 0.5892, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2277, partial_loss/deprel_loss: 0.3805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5210, loss: 0.6769, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  47%|####6     | 52/111 [00:34<00:35,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9481, LAS: 0.9055, UEM: 0.5862, LEM: 0.3568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2382, partial_loss/deprel_loss: 0.4381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5692, loss: 0.6759, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  51%|#####1    | 57/111 [00:36<00:30,  1.78it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9497, LAS: 0.9070, UEM: 0.5991, LEM: 0.3631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1718, partial_loss/deprel_loss: 0.3393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.6644, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  56%|#####5    | 62/111 [00:38<00:25,  1.92it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9489, LAS: 0.9063, UEM: 0.5947, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2533, partial_loss/deprel_loss: 0.3932, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5362, loss: 0.6699, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  59%|#####9    | 66/111 [00:41<00:25,  1.76it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9494, LAS: 0.9067, UEM: 0.5983, LEM: 0.3637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1346, partial_loss/deprel_loss: 0.2575, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4039, loss: 0.6678, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  63%|######3   | 70/111 [00:43<00:23,  1.74it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9503, LAS: 0.9076, UEM: 0.6103, LEM: 0.3730, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2235, partial_loss/deprel_loss: 0.3390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4869, loss: 0.6601, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  67%|######6   | 74/111 [00:46<00:23,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9056, UAS: 0.9505, LAS: 0.9081, UEM: 0.6227, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5366, partial_loss/deprel_loss: 0.5849, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7462, loss: 0.6569, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  70%|#######   | 78/111 [00:50<00:22,  1.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9508, LAS: 0.9084, UEM: 0.6206, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.5950, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7706, loss: 0.6562, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  74%|#######3  | 82/111 [00:52<00:20,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9510, LAS: 0.9085, UEM: 0.6165, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3369, partial_loss/deprel_loss: 0.5227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6566, loss: 0.6572, batch_reg_loss: 0.1710, reg_loss: 0.1711 ||:  77%|#######6  | 85/111 [00:55<00:18,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9511, LAS: 0.9085, UEM: 0.6129, LEM: 0.3792, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5236, partial_loss/deprel_loss: 0.5315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7009, loss: 0.6570, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  79%|#######9  | 88/111 [00:57<00:16,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9504, LAS: 0.9078, UEM: 0.6034, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6980, partial_loss/deprel_loss: 0.6253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8108, loss: 0.6609, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  83%|########2 | 92/111 [00:59<00:13,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9509, LAS: 0.9082, UEM: 0.6093, LEM: 0.3764, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3124, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5815, loss: 0.6571, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  86%|########5 | 95/111 [01:02<00:11,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9513, LAS: 0.9088, UEM: 0.6183, LEM: 0.3879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5063, partial_loss/deprel_loss: 0.6092, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7596, loss: 0.6536, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  88%|########8 | 98/111 [01:04<00:09,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9511, LAS: 0.9085, UEM: 0.6137, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8182, partial_loss/deprel_loss: 0.7218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9121, loss: 0.6563, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  92%|#########1| 102/111 [01:07<00:06,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9506, LAS: 0.9079, UEM: 0.6094, LEM: 0.3796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6152, partial_loss/deprel_loss: 0.6973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8518, loss: 0.6612, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  95%|#########5| 106/111 [01:09<00:03,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8794, UAS: 0.9504, LAS: 0.9075, UEM: 0.6031, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8294, partial_loss/deprel_loss: 0.6723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8747, loss: 0.6649, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:  99%|#########9| 110/111 [01:11<00:00,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9503, LAS: 0.9075, UEM: 0.6013, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5801, partial_loss/deprel_loss: 0.5707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7436, loss: 0.6656, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
      "2023-04-07 00:50:25,578 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:50:25,578 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.571  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.580  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - UEM                      |     0.601  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - LAS                      |     0.907  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - loss                     |     0.666  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - LEM                      |     0.372  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:50:25,579 - INFO - combo.training.tensorboard_writer - UAS                      |     0.950  |       N/A\n",
      "2023-04-07 00:50:25,580 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:50:25,580 - INFO - combo.training.tensorboard_writer - EM                       |     0.903  |       N/A\n",
      "2023-04-07 00:50:25,580 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:50:25,584 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:50:30,371 - INFO - combo.training.trainer - Epoch duration: 0:01:20.352845\n",
      "2023-04-07 00:50:30,372 - INFO - combo.training.trainer - Estimated training time remaining: 7:01:50\n",
      "2023-04-07 00:50:30,372 - INFO - allennlp.training.trainer - Epoch 89/399\n",
      "2023-04-07 00:50:30,372 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:50:30,373 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:50:30,382 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9624, LAS: 0.9199, UEM: 0.6179, LEM: 0.3293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2774, partial_loss/deprel_loss: 0.4097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5542, loss: 0.5893, batch_reg_loss: 0.1710, reg_loss: 0.1710 ||:   3%|2         | 3/111 [00:02<01:13,  1.47it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9575, LAS: 0.9151, UEM: 0.6054, LEM: 0.3576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4951, partial_loss/deprel_loss: 0.5040, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6732, loss: 0.6034, batch_reg_loss: 0.1709, reg_loss: 0.1710 ||:   5%|5         | 6/111 [00:04<01:11,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9608, LAS: 0.9188, UEM: 0.6575, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2058, partial_loss/deprel_loss: 0.3477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4903, loss: 0.5747, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:   8%|8         | 9/111 [00:06<01:13,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9648, UAS: 0.9584, LAS: 0.9174, UEM: 0.7075, LEM: 0.4978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0484, partial_loss/deprel_loss: 0.1350, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2886, loss: 0.5920, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  12%|#1        | 13/111 [00:09<01:12,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8350, UAS: 0.9516, LAS: 0.9103, UEM: 0.6846, LEM: 0.4747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5908, partial_loss/deprel_loss: 0.9539, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2522, loss: 0.6493, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  14%|#4        | 16/111 [00:14<01:31,  1.04it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9528, LAS: 0.9117, UEM: 0.6715, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4789, partial_loss/deprel_loss: 0.5093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6741, loss: 0.6407, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  18%|#8        | 20/111 [00:16<01:18,  1.16it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9546, LAS: 0.9136, UEM: 0.6846, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2704, partial_loss/deprel_loss: 0.4513, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5860, loss: 0.6282, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  21%|##        | 23/111 [00:18<01:10,  1.24it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9526, LAS: 0.9115, UEM: 0.6587, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6559, partial_loss/deprel_loss: 0.6576, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8282, loss: 0.6451, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  24%|##4       | 27/111 [00:20<01:00,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9520, LAS: 0.9108, UEM: 0.6580, LEM: 0.4407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1778, partial_loss/deprel_loss: 0.3197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4622, loss: 0.6525, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  29%|##8       | 32/111 [00:23<00:52,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9523, LAS: 0.9115, UEM: 0.6451, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2655, partial_loss/deprel_loss: 0.3666, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5173, loss: 0.6465, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  33%|###3      | 37/111 [00:25<00:44,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9529, LAS: 0.9117, UEM: 0.6360, LEM: 0.4120, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3649, partial_loss/deprel_loss: 0.4438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5989, loss: 0.6419, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  38%|###7      | 42/111 [00:27<00:37,  1.83it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9533, LAS: 0.9119, UEM: 0.6308, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3812, partial_loss/deprel_loss: 0.4649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6191, loss: 0.6401, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  41%|####1     | 46/111 [00:30<00:37,  1.72it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8989, UAS: 0.9530, LAS: 0.9112, UEM: 0.6381, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4505, partial_loss/deprel_loss: 0.6057, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7455, loss: 0.6447, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  45%|####5     | 50/111 [00:33<00:36,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9541, LAS: 0.9121, UEM: 0.6467, LEM: 0.4193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3036, partial_loss/deprel_loss: 0.4205, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5680, loss: 0.6382, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  49%|####8     | 54/111 [00:35<00:35,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8853, UAS: 0.9531, LAS: 0.9111, UEM: 0.6393, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7622, partial_loss/deprel_loss: 0.6086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8102, loss: 0.6446, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  52%|#####2    | 58/111 [00:38<00:33,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8813, UAS: 0.9534, LAS: 0.9116, UEM: 0.6483, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8199, partial_loss/deprel_loss: 0.5976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8129, loss: 0.6389, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  56%|#####5    | 62/111 [00:41<00:32,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8914, UAS: 0.9523, LAS: 0.9106, UEM: 0.6397, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7800, partial_loss/deprel_loss: 0.5918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8003, loss: 0.6471, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  59%|#####9    | 66/111 [00:44<00:30,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9529, LAS: 0.9111, UEM: 0.6421, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3019, partial_loss/deprel_loss: 0.4465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5885, loss: 0.6425, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  63%|######3   | 70/111 [00:46<00:28,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9534, LAS: 0.9117, UEM: 0.6431, LEM: 0.4159, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2698, partial_loss/deprel_loss: 0.3487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5037, loss: 0.6379, batch_reg_loss: 0.1709, reg_loss: 0.1709 ||:  66%|######5   | 73/111 [00:49<00:26,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8478, UAS: 0.9525, LAS: 0.9106, UEM: 0.6362, LEM: 0.4094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3974, partial_loss/deprel_loss: 0.8038, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0934, loss: 0.6450, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  68%|######8   | 76/111 [00:51<00:24,  1.46it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9526, LAS: 0.9106, UEM: 0.6360, LEM: 0.4098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4778, partial_loss/deprel_loss: 0.5209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6831, loss: 0.6453, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  71%|#######1  | 79/111 [00:53<00:22,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9524, LAS: 0.9105, UEM: 0.6310, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3757, partial_loss/deprel_loss: 0.4632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6165, loss: 0.6464, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  75%|#######4  | 83/111 [00:55<00:18,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8984, UAS: 0.9519, LAS: 0.9099, UEM: 0.6210, LEM: 0.3966, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6011, partial_loss/deprel_loss: 0.6377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8012, loss: 0.6522, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  78%|#######8  | 87/111 [00:58<00:15,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9520, LAS: 0.9102, UEM: 0.6168, LEM: 0.3921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2273, partial_loss/deprel_loss: 0.3068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4617, loss: 0.6498, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  82%|########1 | 91/111 [01:00<00:13,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9522, LAS: 0.9103, UEM: 0.6161, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.4240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5542, loss: 0.6488, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  85%|########4 | 94/111 [01:02<00:11,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9267, UAS: 0.9523, LAS: 0.9104, UEM: 0.6158, LEM: 0.3889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2154, partial_loss/deprel_loss: 0.3287, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.6470, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  87%|########7 | 97/111 [01:05<00:09,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9526, LAS: 0.9105, UEM: 0.6182, LEM: 0.3887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3185, partial_loss/deprel_loss: 0.5270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6561, loss: 0.6454, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  91%|######### | 101/111 [01:07<00:06,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9128, UAS: 0.9519, LAS: 0.9096, UEM: 0.6129, LEM: 0.3839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4470, partial_loss/deprel_loss: 0.5585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7070, loss: 0.6513, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  94%|#########3| 104/111 [01:09<00:04,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9515, LAS: 0.9093, UEM: 0.6072, LEM: 0.3791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6124, partial_loss/deprel_loss: 0.5701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7494, loss: 0.6536, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||:  97%|#########7| 108/111 [01:12<00:02,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9515, LAS: 0.9093, UEM: 0.6053, LEM: 0.3766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4246, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6678, loss: 0.6540, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 100%|##########| 111/111 [01:14<00:00,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9515, LAS: 0.9093, UEM: 0.6053, LEM: 0.3766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4246, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6678, loss: 0.6540, batch_reg_loss: 0.1708, reg_loss: 0.1709 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
      "2023-04-07 00:51:48,085 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.515  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.425  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - UEM                      |     0.605  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - LAS                      |     0.909  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - loss                     |     0.654  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:51:48,086 - INFO - combo.training.tensorboard_writer - LEM                      |     0.377  |       N/A\n",
      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - UAS                      |     0.951  |       N/A\n",
      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - EM                       |     0.909  |       N/A\n",
      "2023-04-07 00:51:48,087 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:51:48,092 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:51:53,928 - INFO - combo.training.trainer - Epoch duration: 0:01:23.555709\n",
      "2023-04-07 00:51:53,928 - INFO - combo.training.trainer - Estimated training time remaining: 7:00:36\n",
      "2023-04-07 00:51:53,928 - INFO - allennlp.training.trainer - Epoch 90/399\n",
      "2023-04-07 00:51:53,928 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:51:53,929 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:51:53,937 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9586, LAS: 0.9155, UEM: 0.5270, LEM: 0.2716, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4390, partial_loss/deprel_loss: 0.4760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6394, loss: 0.6227, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:   4%|3         | 4/111 [00:02<01:11,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9620, LAS: 0.9203, UEM: 0.6100, LEM: 0.3339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3636, partial_loss/deprel_loss: 0.3784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5462, loss: 0.5838, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:   6%|6         | 7/111 [00:05<01:12,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8784, UAS: 0.9583, LAS: 0.9171, UEM: 0.6267, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8749, partial_loss/deprel_loss: 0.6410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8585, loss: 0.6021, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  10%|9         | 11/111 [00:07<01:05,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8722, UAS: 0.9531, LAS: 0.9121, UEM: 0.5706, LEM: 0.3167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9044, partial_loss/deprel_loss: 0.6860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9005, loss: 0.6420, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  14%|#4        | 16/111 [00:09<00:56,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9505, LAS: 0.9098, UEM: 0.5415, LEM: 0.2919, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0960, partial_loss/deprel_loss: 0.7426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9841, loss: 0.6564, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  19%|#8        | 21/111 [00:11<00:50,  1.80it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9480, UAS: 0.9539, LAS: 0.9130, UEM: 0.6156, LEM: 0.3681, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1117, partial_loss/deprel_loss: 0.2053, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3574, loss: 0.6258, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  23%|##3       | 26/111 [00:14<00:48,  1.77it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9558, LAS: 0.9152, UEM: 0.6321, LEM: 0.3780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2744, partial_loss/deprel_loss: 0.3847, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5334, loss: 0.6117, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  27%|##7       | 30/111 [00:17<00:47,  1.69it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8664, UAS: 0.9541, LAS: 0.9137, UEM: 0.6241, LEM: 0.3791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0644, partial_loss/deprel_loss: 0.7645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9952, loss: 0.6239, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  31%|###       | 34/111 [00:20<00:48,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9553, LAS: 0.9151, UEM: 0.6368, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2827, partial_loss/deprel_loss: 0.2994, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4668, loss: 0.6155, batch_reg_loss: 0.1708, reg_loss: 0.1708 ||:  34%|###4      | 38/111 [00:22<00:44,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9557, LAS: 0.9154, UEM: 0.6404, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1780, partial_loss/deprel_loss: 0.3391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4776, loss: 0.6130, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  38%|###7      | 42/111 [00:25<00:44,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8760, UAS: 0.9546, LAS: 0.9140, UEM: 0.6388, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9500, partial_loss/deprel_loss: 0.6070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8463, loss: 0.6205, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  41%|####1     | 46/111 [00:28<00:44,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9547, LAS: 0.9141, UEM: 0.6337, LEM: 0.3903, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3840, partial_loss/deprel_loss: 0.4231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5860, loss: 0.6183, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  45%|####5     | 50/111 [00:30<00:39,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9541, LAS: 0.9134, UEM: 0.6280, LEM: 0.3864, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.4235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5810, loss: 0.6211, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  49%|####8     | 54/111 [00:33<00:37,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9543, LAS: 0.9132, UEM: 0.6260, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, partial_loss/deprel_loss: 0.4607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6095, loss: 0.6207, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  52%|#####2    | 58/111 [00:36<00:36,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9543, LAS: 0.9130, UEM: 0.6279, LEM: 0.3851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2470, partial_loss/deprel_loss: 0.3760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5209, loss: 0.6219, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  55%|#####4    | 61/111 [00:38<00:34,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8940, UAS: 0.9539, LAS: 0.9125, UEM: 0.6219, LEM: 0.3795, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5638, partial_loss/deprel_loss: 0.5155, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6958, loss: 0.6253, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  59%|#####8    | 65/111 [00:41<00:30,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8806, UAS: 0.9537, LAS: 0.9121, UEM: 0.6204, LEM: 0.3791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8245, partial_loss/deprel_loss: 0.6926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8897, loss: 0.6278, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  61%|######1   | 68/111 [00:43<00:29,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9538, LAS: 0.9124, UEM: 0.6296, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0910, partial_loss/deprel_loss: 0.2150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3609, loss: 0.6257, batch_reg_loss: 0.1707, reg_loss: 0.1708 ||:  64%|######3   | 71/111 [00:45<00:29,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9180, UAS: 0.9534, LAS: 0.9119, UEM: 0.6202, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3472, partial_loss/deprel_loss: 0.4775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6221, loss: 0.6306, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  68%|######7   | 75/111 [00:48<00:25,  1.42it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8772, UAS: 0.9531, LAS: 0.9114, UEM: 0.6143, LEM: 0.3787, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8013, partial_loss/deprel_loss: 0.6878, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8812, loss: 0.6355, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  70%|#######   | 78/111 [00:50<00:23,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9010, UAS: 0.9531, LAS: 0.9113, UEM: 0.6071, LEM: 0.3708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5766, partial_loss/deprel_loss: 0.6206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7825, loss: 0.6377, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  74%|#######3  | 82/111 [00:53<00:19,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8973, UAS: 0.9525, LAS: 0.9106, UEM: 0.6012, LEM: 0.3661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4863, partial_loss/deprel_loss: 0.5547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7117, loss: 0.6427, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  77%|#######6  | 85/111 [00:55<00:17,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8907, UAS: 0.9518, LAS: 0.9098, UEM: 0.5942, LEM: 0.3610, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7252, partial_loss/deprel_loss: 0.6054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8001, loss: 0.6498, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  79%|#######9  | 88/111 [00:57<00:15,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9520, LAS: 0.9100, UEM: 0.5902, LEM: 0.3561, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2696, partial_loss/deprel_loss: 0.3801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5287, loss: 0.6494, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  83%|########2 | 92/111 [00:59<00:12,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9525, LAS: 0.9105, UEM: 0.5960, LEM: 0.3611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1836, partial_loss/deprel_loss: 0.2796, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4311, loss: 0.6452, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  86%|########5 | 95/111 [01:02<00:11,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9515, LAS: 0.9095, UEM: 0.5901, LEM: 0.3562, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6474, partial_loss/deprel_loss: 0.6101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7882, loss: 0.6541, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  89%|########9 | 99/111 [01:04<00:08,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9516, LAS: 0.9096, UEM: 0.5925, LEM: 0.3564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7554, partial_loss/deprel_loss: 0.5501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7618, loss: 0.6533, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  92%|#########1| 102/111 [01:07<00:06,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8992, UAS: 0.9509, LAS: 0.9089, UEM: 0.5867, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5455, partial_loss/deprel_loss: 0.5296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7035, loss: 0.6580, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  95%|#########4| 105/111 [01:09<00:04,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9513, LAS: 0.9093, UEM: 0.5920, LEM: 0.3550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2537, partial_loss/deprel_loss: 0.4396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5731, loss: 0.6548, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  97%|#########7| 108/111 [01:11<00:02,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9515, LAS: 0.9096, UEM: 0.6028, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6137, partial_loss/deprel_loss: 0.5685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7482, loss: 0.6535, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 100%|##########| 111/111 [01:14<00:00,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9515, LAS: 0.9096, UEM: 0.6028, LEM: 0.3725, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6137, partial_loss/deprel_loss: 0.5685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7482, loss: 0.6535, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
      "2023-04-07 00:53:10,727 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9666, LAS: 0.9178, UEM: 0.7733, LEM: 0.4474, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4139, partial_loss/deprel_loss: 25.6641, partial_loss/cycle_loss: 0.0000, batch_loss: 20.6140, loss: 19.3419, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.20it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8775, UAS: 0.9579, LAS: 0.9100, UEM: 0.7512, LEM: 0.4936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9262, partial_loss/deprel_loss: 35.7394, partial_loss/cycle_loss: 0.0000, batch_loss: 28.7767, loss: 21.8718, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:05<00:04,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8804, UAS: 0.9531, LAS: 0.9020, UEM: 0.6854, LEM: 0.4134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7791, partial_loss/deprel_loss: 28.9505, partial_loss/cycle_loss: 0.0000, batch_loss: 23.3162, loss: 23.2931, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:07<00:01,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.9464, LAS: 0.8943, UEM: 0.6498, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7166, partial_loss/deprel_loss: 55.2239, partial_loss/cycle_loss: 0.0000, batch_loss: 44.5224, loss: 25.0047, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:09<00:00,  1.39it/s]\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.569  |    55.224\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.614  |     1.717\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |     0.000\n",
      "2023-04-07 00:53:20,057 - INFO - combo.training.tensorboard_writer - UEM                      |     0.603  |     0.650\n",
      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - LAS                      |     0.910  |     0.894\n",
      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - loss                     |     0.654  |    25.005\n",
      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - LEM                      |     0.372  |     0.386\n",
      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - UAS                      |     0.951  |     0.946\n",
      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - EM                       |     0.904  |     0.829\n",
      "2023-04-07 00:53:20,058 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:53:20,063 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 00:53:24,854 - INFO - combo.training.trainer - Epoch duration: 0:01:30.925328\n",
      "2023-04-07 00:53:24,854 - INFO - combo.training.trainer - Estimated training time remaining: 6:59:47\n",
      "2023-04-07 00:53:24,854 - INFO - allennlp.training.trainer - Epoch 91/399\n",
      "2023-04-07 00:53:24,854 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:53:24,855 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:53:24,864 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8414, UAS: 0.9196, LAS: 0.8740, UEM: 0.1556, LEM: 0.0356, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5877, partial_loss/deprel_loss: 0.9074, partial_loss/cycle_loss: 0.0000, batch_loss: 1.2141, loss: 0.9081, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:   3%|2         | 3/111 [00:02<01:18,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9417, LAS: 0.9000, UEM: 0.5139, LEM: 0.2751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5749, partial_loss/deprel_loss: 0.4906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6781, loss: 0.7202, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:   6%|6         | 7/111 [00:04<01:12,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8703, UAS: 0.9332, LAS: 0.8911, UEM: 0.4231, LEM: 0.2178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9388, partial_loss/deprel_loss: 0.7218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9358, loss: 0.7898, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  10%|9         | 11/111 [00:07<01:07,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8817, UAS: 0.9391, LAS: 0.8975, UEM: 0.5123, LEM: 0.3099, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6934, partial_loss/deprel_loss: 0.6334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8161, loss: 0.7382, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  14%|#3        | 15/111 [00:09<01:03,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9411, LAS: 0.8992, UEM: 0.4980, LEM: 0.2940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2657, partial_loss/deprel_loss: 0.3629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.7306, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  16%|#6        | 18/111 [00:11<01:03,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9448, LAS: 0.9035, UEM: 0.5821, LEM: 0.3803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1763, partial_loss/deprel_loss: 0.2714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4230, loss: 0.6973, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  19%|#8        | 21/111 [00:14<01:03,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9467, LAS: 0.9060, UEM: 0.5947, LEM: 0.3892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1693, partial_loss/deprel_loss: 0.2629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4149, loss: 0.6790, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  22%|##1       | 24/111 [00:16<01:03,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9484, LAS: 0.9081, UEM: 0.5871, LEM: 0.3703, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2777, partial_loss/deprel_loss: 0.3964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5434, loss: 0.6673, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  25%|##5       | 28/111 [00:18<00:57,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9507, LAS: 0.9106, UEM: 0.6326, LEM: 0.4190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3565, partial_loss/deprel_loss: 0.4421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5957, loss: 0.6473, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  28%|##7       | 31/111 [00:21<00:58,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8635, UAS: 0.9501, LAS: 0.9099, UEM: 0.6233, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1390, partial_loss/deprel_loss: 0.7462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9954, loss: 0.6526, batch_reg_loss: 0.1707, reg_loss: 0.1707 ||:  32%|###1      | 35/111 [00:23<00:53,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9501, LAS: 0.9099, UEM: 0.6146, LEM: 0.3962, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7562, partial_loss/deprel_loss: 0.6199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8178, loss: 0.6525, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  34%|###4      | 38/111 [00:26<00:50,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8731, UAS: 0.9507, LAS: 0.9103, UEM: 0.6202, LEM: 0.3983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0333, partial_loss/deprel_loss: 0.7240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9565, loss: 0.6498, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  38%|###7      | 42/111 [00:28<00:47,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8811, UAS: 0.9501, LAS: 0.9096, UEM: 0.6078, LEM: 0.3855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0019, partial_loss/deprel_loss: 0.5839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8381, loss: 0.6546, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  41%|####1     | 46/111 [00:31<00:42,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9508, LAS: 0.9102, UEM: 0.6114, LEM: 0.3855, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2693, partial_loss/deprel_loss: 0.4158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5571, loss: 0.6488, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  45%|####5     | 50/111 [00:33<00:40,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9505, LAS: 0.9100, UEM: 0.6099, LEM: 0.3849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2493, partial_loss/deprel_loss: 0.3717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5179, loss: 0.6507, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  49%|####8     | 54/111 [00:36<00:38,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9514, LAS: 0.9109, UEM: 0.6192, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3527, partial_loss/deprel_loss: 0.4770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6227, loss: 0.6443, batch_reg_loss: 0.1706, reg_loss: 0.1707 ||:  52%|#####2    | 58/111 [00:39<00:36,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9515, LAS: 0.9108, UEM: 0.6114, LEM: 0.3828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6184, partial_loss/deprel_loss: 0.5387, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7252, loss: 0.6485, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  56%|#####5    | 62/111 [00:42<00:33,  1.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9513, LAS: 0.9104, UEM: 0.6053, LEM: 0.3773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3285, partial_loss/deprel_loss: 0.4954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6326, loss: 0.6525, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  59%|#####9    | 66/111 [00:44<00:30,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8940, UAS: 0.9512, LAS: 0.9098, UEM: 0.5997, LEM: 0.3700, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4839, partial_loss/deprel_loss: 0.6563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7924, loss: 0.6560, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  63%|######3   | 70/111 [00:47<00:28,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9680, UAS: 0.9520, LAS: 0.9109, UEM: 0.6199, LEM: 0.3973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0445, partial_loss/deprel_loss: 0.1407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2920, loss: 0.6489, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  66%|######5   | 73/111 [00:49<00:27,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9522, LAS: 0.9109, UEM: 0.6165, LEM: 0.3915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3092, partial_loss/deprel_loss: 0.4750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6124, loss: 0.6500, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  68%|######8   | 76/111 [00:52<00:25,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8874, UAS: 0.9519, LAS: 0.9106, UEM: 0.6132, LEM: 0.3887, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7848, partial_loss/deprel_loss: 0.6318, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8330, loss: 0.6508, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  71%|#######1  | 79/111 [00:54<00:23,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9523, LAS: 0.9111, UEM: 0.6146, LEM: 0.3882, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2224, partial_loss/deprel_loss: 0.3762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.6476, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  74%|#######3  | 82/111 [00:56<00:20,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9525, LAS: 0.9114, UEM: 0.6173, LEM: 0.3902, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7428, partial_loss/deprel_loss: 0.5632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7697, loss: 0.6460, batch_reg_loss: 0.1706, reg_loss: 0.1706 ||:  77%|#######6  | 85/111 [00:58<00:19,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9521, LAS: 0.9110, UEM: 0.6158, LEM: 0.3891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2247, partial_loss/deprel_loss: 0.3346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4831, loss: 0.6467, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  81%|########1 | 90/111 [01:01<00:14,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9031, UAS: 0.9520, LAS: 0.9106, UEM: 0.6101, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5589, partial_loss/deprel_loss: 0.5639, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7335, loss: 0.6502, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  85%|########4 | 94/111 [01:03<00:10,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9528, LAS: 0.9115, UEM: 0.6231, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2567, partial_loss/deprel_loss: 0.3461, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4987, loss: 0.6430, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  88%|########8 | 98/111 [01:06<00:08,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9529, LAS: 0.9116, UEM: 0.6202, LEM: 0.3901, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6575, partial_loss/deprel_loss: 0.6112, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7910, loss: 0.6424, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  92%|#########1| 102/111 [01:08<00:05,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9525, LAS: 0.9110, UEM: 0.6148, LEM: 0.3845, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5890, partial_loss/deprel_loss: 0.5102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6965, loss: 0.6469, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  95%|#########5| 106/111 [01:11<00:03,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8758, UAS: 0.9521, LAS: 0.9106, UEM: 0.6092, LEM: 0.3793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9806, partial_loss/deprel_loss: 0.7078, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9329, loss: 0.6498, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||:  99%|#########9| 110/111 [01:13<00:00,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9520, LAS: 0.9104, UEM: 0.6071, LEM: 0.3778, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8246, partial_loss/deprel_loss: 0.6674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8694, loss: 0.6518, batch_reg_loss: 0.1705, reg_loss: 0.1706 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:54:41,915 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.667  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.825  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.171  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - UEM                      |     0.607  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - LAS                      |     0.910  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - loss                     |     0.652  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - LEM                      |     0.378  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - UAS                      |     0.952  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - EM                       |     0.891  |       N/A\n",
      "2023-04-07 00:54:41,916 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:54:41,921 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:54:46,283 - INFO - combo.training.trainer - Epoch duration: 0:01:21.429347\n",
      "2023-04-07 00:54:46,284 - INFO - combo.training.trainer - Estimated training time remaining: 6:58:25\n",
      "2023-04-07 00:54:46,284 - INFO - allennlp.training.trainer - Epoch 92/399\n",
      "2023-04-07 00:54:46,284 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:54:46,285 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:54:46,293 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9542, LAS: 0.9139, UEM: 0.7424, LEM: 0.5818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5152, partial_loss/deprel_loss: 0.5199, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6895, loss: 0.6134, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:   3%|2         | 3/111 [00:02<01:21,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9128, UAS: 0.9479, LAS: 0.9073, UEM: 0.6124, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3346, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5882, loss: 0.6523, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:   5%|5         | 6/111 [00:04<01:18,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9463, LAS: 0.9048, UEM: 0.6333, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 0.3244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4584, loss: 0.6718, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:   9%|9         | 10/111 [00:06<01:11,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9422, LAS: 0.9000, UEM: 0.5906, LEM: 0.3838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4059, partial_loss/deprel_loss: 0.4657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6242, loss: 0.7008, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:  12%|#1        | 13/111 [00:09<01:10,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9447, LAS: 0.9030, UEM: 0.5856, LEM: 0.3780, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2784, partial_loss/deprel_loss: 0.3270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4878, loss: 0.6912, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:  15%|#5        | 17/111 [00:11<01:06,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9470, LAS: 0.9053, UEM: 0.5853, LEM: 0.3640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2329, partial_loss/deprel_loss: 0.3702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5132, loss: 0.6773, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:  19%|#8        | 21/111 [00:14<01:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8945, UAS: 0.9460, LAS: 0.9037, UEM: 0.5511, LEM: 0.3347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6266, partial_loss/deprel_loss: 0.5975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7738, loss: 0.6872, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:  23%|##2       | 25/111 [00:16<00:55,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9259, UAS: 0.9480, LAS: 0.9061, UEM: 0.5590, LEM: 0.3307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2587, partial_loss/deprel_loss: 0.3937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5371, loss: 0.6726, batch_reg_loss: 0.1705, reg_loss: 0.1705 ||:  26%|##6       | 29/111 [00:19<00:52,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9489, LAS: 0.9070, UEM: 0.5670, LEM: 0.3330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7531, partial_loss/deprel_loss: 0.5853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7893, loss: 0.6676, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  29%|##8       | 32/111 [00:21<00:52,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9491, LAS: 0.9076, UEM: 0.5801, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1063, partial_loss/deprel_loss: 0.2096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3594, loss: 0.6631, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  32%|###1      | 35/111 [00:23<00:53,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9488, LAS: 0.9072, UEM: 0.5672, LEM: 0.3429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3363, partial_loss/deprel_loss: 0.4694, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6132, loss: 0.6686, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  34%|###4      | 38/111 [00:25<00:52,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9494, LAS: 0.9079, UEM: 0.5780, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1917, partial_loss/deprel_loss: 0.3255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4692, loss: 0.6623, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  37%|###6      | 41/111 [00:28<00:51,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9505, LAS: 0.9092, UEM: 0.5912, LEM: 0.3617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2921, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.6529, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  40%|###9      | 44/111 [00:30<00:48,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8648, UAS: 0.9502, LAS: 0.9091, UEM: 0.5955, LEM: 0.3680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2522, partial_loss/deprel_loss: 0.6656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9533, loss: 0.6536, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  42%|####2     | 47/111 [00:32<00:47,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9506, LAS: 0.9097, UEM: 0.5931, LEM: 0.3639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2855, partial_loss/deprel_loss: 0.3769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5290, loss: 0.6486, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  45%|####5     | 50/111 [00:35<00:47,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9503, LAS: 0.9092, UEM: 0.5891, LEM: 0.3591, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4746, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6548, loss: 0.6510, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  49%|####8     | 54/111 [00:37<00:40,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9506, LAS: 0.9095, UEM: 0.5857, LEM: 0.3544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3050, partial_loss/deprel_loss: 0.3623, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5212, loss: 0.6479, batch_reg_loss: 0.1704, reg_loss: 0.1705 ||:  51%|#####1    | 57/111 [00:39<00:39,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9515, LAS: 0.9105, UEM: 0.5931, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1843, partial_loss/deprel_loss: 0.2933, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4419, loss: 0.6429, batch_reg_loss: 0.1704, reg_loss: 0.1704 ||:  55%|#####4    | 61/111 [00:42<00:35,  1.40it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8981, UAS: 0.9504, LAS: 0.9094, UEM: 0.5806, LEM: 0.3502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6265, partial_loss/deprel_loss: 0.5127, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7059, loss: 0.6522, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  59%|#####8    | 65/111 [00:44<00:31,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8873, UAS: 0.9501, LAS: 0.9092, UEM: 0.5760, LEM: 0.3450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9519, partial_loss/deprel_loss: 0.6115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8500, loss: 0.6552, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  62%|######2   | 69/111 [00:47<00:27,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9514, LAS: 0.9108, UEM: 0.6083, LEM: 0.3858, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4295, partial_loss/deprel_loss: 0.4640, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6274, loss: 0.6452, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  66%|######5   | 73/111 [00:50<00:26,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9524, LAS: 0.9119, UEM: 0.6201, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3675, partial_loss/deprel_loss: 0.3858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5524, loss: 0.6368, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  69%|######9   | 77/111 [00:53<00:23,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9531, LAS: 0.9123, UEM: 0.6260, LEM: 0.3974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1469, partial_loss/deprel_loss: 0.3113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4487, loss: 0.6328, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  72%|#######2  | 80/111 [00:55<00:21,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9530, LAS: 0.9125, UEM: 0.6196, LEM: 0.3912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6422, partial_loss/deprel_loss: 0.5340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7260, loss: 0.6324, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  76%|#######5  | 84/111 [00:57<00:17,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9531, LAS: 0.9127, UEM: 0.6151, LEM: 0.3860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3872, partial_loss/deprel_loss: 0.4186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5826, loss: 0.6309, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  79%|#######9  | 88/111 [00:59<00:14,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9534, LAS: 0.9129, UEM: 0.6182, LEM: 0.3891, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1823, partial_loss/deprel_loss: 0.3832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5133, loss: 0.6296, batch_reg_loss: 0.1703, reg_loss: 0.1704 ||:  83%|########2 | 92/111 [01:02<00:11,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9536, LAS: 0.9132, UEM: 0.6242, LEM: 0.3969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1635, partial_loss/deprel_loss: 0.3041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4462, loss: 0.6277, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||:  86%|########6 | 96/111 [01:04<00:08,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9539, LAS: 0.9134, UEM: 0.6223, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5956, partial_loss/deprel_loss: 0.5345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7169, loss: 0.6272, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||:  91%|######### | 101/111 [01:06<00:05,  1.80it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9542, LAS: 0.9139, UEM: 0.6224, LEM: 0.3937, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2040, partial_loss/deprel_loss: 0.2981, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4494, loss: 0.6243, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||:  95%|#########5| 106/111 [01:09<00:02,  1.82it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9536, LAS: 0.9133, UEM: 0.6157, LEM: 0.3883, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3588, partial_loss/deprel_loss: 0.4519, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.6290, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||:  99%|#########9| 110/111 [01:12<00:00,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9536, LAS: 0.9133, UEM: 0.6142, LEM: 0.3870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4580, partial_loss/deprel_loss: 0.4665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6350, loss: 0.6291, batch_reg_loss: 0.1702, reg_loss: 0.1704 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:56:02,419 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.467  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.458  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.170  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - UEM                      |     0.614  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - LAS                      |     0.913  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - loss                     |     0.629  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - LEM                      |     0.387  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - UAS                      |     0.954  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - EM                       |     0.915  |       N/A\n",
      "2023-04-07 00:56:02,420 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:56:02,425 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:56:07,411 - INFO - combo.training.trainer - Epoch duration: 0:01:21.127162\n",
      "2023-04-07 00:56:07,412 - INFO - combo.training.trainer - Estimated training time remaining: 6:57:02\n",
      "2023-04-07 00:56:07,412 - INFO - allennlp.training.trainer - Epoch 93/399\n",
      "2023-04-07 00:56:07,412 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:56:07,413 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:56:07,422 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9622, LAS: 0.9221, UEM: 0.7398, LEM: 0.5281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1570, partial_loss/deprel_loss: 0.2857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4302, loss: 0.5584, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||:   4%|3         | 4/111 [00:02<01:17,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9572, LAS: 0.9153, UEM: 0.6616, LEM: 0.4305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2660, partial_loss/deprel_loss: 0.4206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5599, loss: 0.6086, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||:   7%|7         | 8/111 [00:05<01:10,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9590, LAS: 0.9168, UEM: 0.6598, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2378, partial_loss/deprel_loss: 0.3891, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5290, loss: 0.6018, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||:  10%|9         | 11/111 [00:07<01:09,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8960, UAS: 0.9566, LAS: 0.9156, UEM: 0.6450, LEM: 0.4066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6822, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7548, loss: 0.6125, batch_reg_loss: 0.1702, reg_loss: 0.1702 ||:  13%|#2        | 14/111 [00:09<01:10,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9550, LAS: 0.9141, UEM: 0.6348, LEM: 0.3942, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2216, partial_loss/deprel_loss: 0.3102, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4626, loss: 0.6239, batch_reg_loss: 0.1701, reg_loss: 0.1702 ||:  15%|#5        | 17/111 [00:11<01:07,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9546, LAS: 0.9142, UEM: 0.6136, LEM: 0.3776, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4356, partial_loss/deprel_loss: 0.4792, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6406, loss: 0.6247, batch_reg_loss: 0.1701, reg_loss: 0.1702 ||:  19%|#8        | 21/111 [00:14<01:01,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9557, LAS: 0.9156, UEM: 0.6347, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1566, partial_loss/deprel_loss: 0.2693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4169, loss: 0.6161, batch_reg_loss: 0.1701, reg_loss: 0.1702 ||:  23%|##2       | 25/111 [00:16<00:57,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9546, LAS: 0.9146, UEM: 0.6127, LEM: 0.3836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3816, partial_loss/deprel_loss: 0.4059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5711, loss: 0.6273, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||:  26%|##6       | 29/111 [00:19<00:53,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9565, LAS: 0.9172, UEM: 0.6595, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1907, partial_loss/deprel_loss: 0.3468, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4857, loss: 0.6083, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||:  29%|##8       | 32/111 [00:21<00:53,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9561, LAS: 0.9169, UEM: 0.6562, LEM: 0.4394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1723, partial_loss/deprel_loss: 0.3134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4553, loss: 0.6078, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||:  32%|###2      | 36/111 [00:24<00:52,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8968, UAS: 0.9555, LAS: 0.9164, UEM: 0.6497, LEM: 0.4317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7917, partial_loss/deprel_loss: 0.5317, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7538, loss: 0.6085, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||:  35%|###5      | 39/111 [00:26<00:53,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9564, LAS: 0.9174, UEM: 0.6608, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1739, partial_loss/deprel_loss: 0.3126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4549, loss: 0.6001, batch_reg_loss: 0.1701, reg_loss: 0.1701 ||:  38%|###7      | 42/111 [00:29<00:53,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9564, LAS: 0.9173, UEM: 0.6523, LEM: 0.4318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2875, partial_loss/deprel_loss: 0.3333, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4941, loss: 0.6016, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  41%|####      | 45/111 [00:31<00:49,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9561, LAS: 0.9169, UEM: 0.6436, LEM: 0.4207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5652, loss: 0.6044, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  44%|####4     | 49/111 [00:34<00:44,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8913, UAS: 0.9565, LAS: 0.9175, UEM: 0.6450, LEM: 0.4208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6738, partial_loss/deprel_loss: 0.5516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7461, loss: 0.6009, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  48%|####7     | 53/111 [00:36<00:40,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9563, LAS: 0.9174, UEM: 0.6370, LEM: 0.4121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4258, partial_loss/deprel_loss: 0.3993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5746, loss: 0.6023, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  50%|#####     | 56/111 [00:38<00:38,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9077, UAS: 0.9566, LAS: 0.9178, UEM: 0.6402, LEM: 0.4125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5124, partial_loss/deprel_loss: 0.5456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7090, loss: 0.6001, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  53%|#####3    | 59/111 [00:40<00:36,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9570, LAS: 0.9181, UEM: 0.6485, LEM: 0.4235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.4408, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5885, loss: 0.5983, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  56%|#####5    | 62/111 [00:43<00:34,  1.42it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9567, LAS: 0.9178, UEM: 0.6434, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2561, partial_loss/deprel_loss: 0.3669, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5147, loss: 0.5990, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  59%|#####8    | 65/111 [00:45<00:32,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9572, LAS: 0.9183, UEM: 0.6455, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2146, partial_loss/deprel_loss: 0.2871, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4426, loss: 0.5950, batch_reg_loss: 0.1700, reg_loss: 0.1701 ||:  61%|######1   | 68/111 [00:47<00:31,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9570, LAS: 0.9181, UEM: 0.6403, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5097, partial_loss/deprel_loss: 0.4827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6581, loss: 0.5962, batch_reg_loss: 0.1699, reg_loss: 0.1701 ||:  64%|######3   | 71/111 [00:49<00:29,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9570, LAS: 0.9181, UEM: 0.6342, LEM: 0.4048, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6196, partial_loss/deprel_loss: 0.5692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7492, loss: 0.5984, batch_reg_loss: 0.1699, reg_loss: 0.1701 ||:  68%|######8   | 76/111 [00:52<00:23,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8820, UAS: 0.9560, LAS: 0.9172, UEM: 0.6291, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9994, partial_loss/deprel_loss: 0.7024, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9317, loss: 0.6070, batch_reg_loss: 0.1699, reg_loss: 0.1701 ||:  73%|#######2  | 81/111 [00:54<00:18,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8847, UAS: 0.9563, LAS: 0.9174, UEM: 0.6301, LEM: 0.3992, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6907, partial_loss/deprel_loss: 0.7202, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8842, loss: 0.6059, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||:  77%|#######7  | 86/111 [00:57<00:14,  1.76it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9553, LAS: 0.9163, UEM: 0.6202, LEM: 0.3909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5477, partial_loss/deprel_loss: 0.5488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7185, loss: 0.6131, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||:  82%|########1 | 91/111 [00:59<00:10,  1.82it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9093, UAS: 0.9557, LAS: 0.9167, UEM: 0.6267, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4010, partial_loss/deprel_loss: 0.5455, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6865, loss: 0.6099, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||:  86%|########5 | 95/111 [01:02<00:09,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9554, LAS: 0.9163, UEM: 0.6206, LEM: 0.3909, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6465, partial_loss/deprel_loss: 0.5652, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7514, loss: 0.6136, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||:  89%|########9 | 99/111 [01:05<00:07,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9553, LAS: 0.9162, UEM: 0.6243, LEM: 0.3965, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1391, partial_loss/deprel_loss: 0.2918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4311, loss: 0.6134, batch_reg_loss: 0.1699, reg_loss: 0.1700 ||:  93%|#########2| 103/111 [01:07<00:05,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9549, LAS: 0.9158, UEM: 0.6186, LEM: 0.3910, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3359, partial_loss/deprel_loss: 0.4198, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5729, loss: 0.6165, batch_reg_loss: 0.1698, reg_loss: 0.1700 ||:  96%|#########6| 107/111 [01:10<00:02,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9545, LAS: 0.9154, UEM: 0.6144, LEM: 0.3875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3012, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5413, loss: 0.6187, batch_reg_loss: 0.1698, reg_loss: 0.1700 ||: 100%|##########| 111/111 [01:13<00:00,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9545, LAS: 0.9154, UEM: 0.6144, LEM: 0.3875, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3012, partial_loss/deprel_loss: 0.3890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5413, loss: 0.6187, batch_reg_loss: 0.1698, reg_loss: 0.1700 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:57:23,892 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.389  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.301  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.170  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - UEM                      |     0.614  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - LAS                      |     0.915  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - loss                     |     0.619  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - LEM                      |     0.388  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:57:23,893 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |       N/A\n",
      "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - EM                       |     0.931  |       N/A\n",
      "2023-04-07 00:57:23,894 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:57:23,899 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:57:29,960 - INFO - combo.training.trainer - Epoch duration: 0:01:22.548285\n",
      "2023-04-07 00:57:29,961 - INFO - combo.training.trainer - Estimated training time remaining: 6:55:44\n",
      "2023-04-07 00:57:29,961 - INFO - allennlp.training.trainer - Epoch 94/399\n",
      "2023-04-07 00:57:29,961 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:57:29,962 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:57:29,970 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9521, LAS: 0.9133, UEM: 0.4149, LEM: 0.2060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3573, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5899, loss: 0.6595, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:   3%|2         | 3/111 [00:02<01:12,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9224, UAS: 0.9525, LAS: 0.9124, UEM: 0.4244, LEM: 0.1976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2817, partial_loss/deprel_loss: 0.3916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.6374, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:   6%|6         | 7/111 [00:04<01:06,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9542, LAS: 0.9137, UEM: 0.4699, LEM: 0.2229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.3456, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4891, loss: 0.6316, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  10%|9         | 11/111 [00:06<01:03,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9194, UAS: 0.9548, LAS: 0.9140, UEM: 0.4912, LEM: 0.2354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2900, partial_loss/deprel_loss: 0.4000, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5478, loss: 0.6281, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  13%|#2        | 14/111 [00:08<01:03,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8987, UAS: 0.9528, LAS: 0.9122, UEM: 0.4714, LEM: 0.2223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7772, partial_loss/deprel_loss: 0.5558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7698, loss: 0.6451, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  16%|#6        | 18/111 [00:11<01:00,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8897, UAS: 0.9527, LAS: 0.9119, UEM: 0.4715, LEM: 0.2221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8692, partial_loss/deprel_loss: 0.6261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8445, loss: 0.6476, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  20%|#9        | 22/111 [00:13<00:57,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9716, UAS: 0.9558, LAS: 0.9159, UEM: 0.5880, LEM: 0.3642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0331, partial_loss/deprel_loss: 0.1041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2597, loss: 0.6200, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  23%|##2       | 25/111 [00:16<00:59,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9549, LAS: 0.9152, UEM: 0.5827, LEM: 0.3626, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5290, partial_loss/deprel_loss: 0.4605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6440, loss: 0.6231, batch_reg_loss: 0.1698, reg_loss: 0.1698 ||:  25%|##5       | 28/111 [00:18<01:00,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9555, LAS: 0.9158, UEM: 0.5982, LEM: 0.3751, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3287, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5442, loss: 0.6142, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  28%|##7       | 31/111 [00:20<00:58,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8926, UAS: 0.9560, LAS: 0.9164, UEM: 0.6102, LEM: 0.3853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7661, partial_loss/deprel_loss: 0.5392, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7543, loss: 0.6087, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  31%|###       | 34/111 [00:23<00:56,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9562, LAS: 0.9169, UEM: 0.6093, LEM: 0.3828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1732, partial_loss/deprel_loss: 0.2811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4293, loss: 0.6057, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  33%|###3      | 37/111 [00:25<00:54,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9571, LAS: 0.9176, UEM: 0.6248, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3037, partial_loss/deprel_loss: 0.3452, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5066, loss: 0.6012, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  37%|###6      | 41/111 [00:28<00:49,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9555, LAS: 0.9159, UEM: 0.6103, LEM: 0.3832, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5706, partial_loss/deprel_loss: 0.5425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7178, loss: 0.6149, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  40%|###9      | 44/111 [00:30<00:46,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9549, LAS: 0.9153, UEM: 0.6039, LEM: 0.3760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2421, partial_loss/deprel_loss: 0.3133, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4688, loss: 0.6180, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  42%|####2     | 47/111 [00:32<00:45,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9113, UAS: 0.9551, LAS: 0.9155, UEM: 0.5987, LEM: 0.3679, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6414, partial_loss/deprel_loss: 0.5149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7099, loss: 0.6183, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  45%|####5     | 50/111 [00:34<00:43,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9556, LAS: 0.9162, UEM: 0.6107, LEM: 0.3821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1239, partial_loss/deprel_loss: 0.2417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3878, loss: 0.6148, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  48%|####7     | 53/111 [00:36<00:41,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9538, LAS: 0.9145, UEM: 0.6052, LEM: 0.3785, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2717, partial_loss/deprel_loss: 0.3415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.6253, batch_reg_loss: 0.1697, reg_loss: 0.1698 ||:  50%|#####     | 56/111 [00:38<00:38,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9546, LAS: 0.9152, UEM: 0.6152, LEM: 0.3848, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1899, partial_loss/deprel_loss: 0.2864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4368, loss: 0.6189, batch_reg_loss: 0.1697, reg_loss: 0.1697 ||:  55%|#####4    | 61/111 [00:40<00:31,  1.58it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9545, LAS: 0.9149, UEM: 0.6062, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1938, partial_loss/deprel_loss: 0.3977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5266, loss: 0.6216, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  59%|#####9    | 66/111 [00:43<00:26,  1.72it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8609, UAS: 0.9538, LAS: 0.9138, UEM: 0.6011, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0929, partial_loss/deprel_loss: 0.7331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9747, loss: 0.6295, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  64%|######3   | 71/111 [00:45<00:22,  1.79it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9542, LAS: 0.9143, UEM: 0.6086, LEM: 0.3763, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1674, partial_loss/deprel_loss: 0.2936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4380, loss: 0.6262, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  68%|######7   | 75/111 [00:48<00:20,  1.73it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9537, LAS: 0.9138, UEM: 0.6020, LEM: 0.3701, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4646, partial_loss/deprel_loss: 0.4516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6238, loss: 0.6289, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  71%|#######1  | 79/111 [00:50<00:18,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8975, UAS: 0.9539, LAS: 0.9140, UEM: 0.5997, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7002, partial_loss/deprel_loss: 0.6113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7987, loss: 0.6289, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  75%|#######4  | 83/111 [00:53<00:16,  1.71it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9544, LAS: 0.9147, UEM: 0.6118, LEM: 0.3806, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2079, partial_loss/deprel_loss: 0.3162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4641, loss: 0.6233, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  78%|#######8  | 87/111 [00:56<00:15,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9043, UAS: 0.9549, LAS: 0.9153, UEM: 0.6189, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5173, partial_loss/deprel_loss: 0.5162, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6860, loss: 0.6188, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  82%|########1 | 91/111 [00:58<00:13,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8417, UAS: 0.9545, LAS: 0.9148, UEM: 0.6184, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6372, partial_loss/deprel_loss: 0.7892, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1283, loss: 0.6222, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  86%|########5 | 95/111 [01:01<00:10,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9547, LAS: 0.9150, UEM: 0.6189, LEM: 0.3840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2109, partial_loss/deprel_loss: 0.3147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4635, loss: 0.6209, batch_reg_loss: 0.1696, reg_loss: 0.1697 ||:  88%|########8 | 98/111 [01:04<00:09,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9547, LAS: 0.9151, UEM: 0.6162, LEM: 0.3814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3293, partial_loss/deprel_loss: 0.4396, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5871, loss: 0.6197, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||:  92%|#########1| 102/111 [01:06<00:06,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9550, LAS: 0.9154, UEM: 0.6205, LEM: 0.3849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4263, partial_loss/deprel_loss: 0.4916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6481, loss: 0.6173, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||:  95%|#########5| 106/111 [01:09<00:03,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9547, LAS: 0.9151, UEM: 0.6143, LEM: 0.3793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3580, partial_loss/deprel_loss: 0.4075, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5671, loss: 0.6200, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||:  99%|#########9| 110/111 [01:11<00:00,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9572, UAS: 0.9550, LAS: 0.9155, UEM: 0.6235, LEM: 0.3915, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0758, partial_loss/deprel_loss: 0.1748, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3245, loss: 0.6173, batch_reg_loss: 0.1695, reg_loss: 0.1697 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
      "2023-04-07 00:58:45,473 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 00:58:45,473 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.175  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.076  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.170  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - UEM                      |     0.624  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - LAS                      |     0.915  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - loss                     |     0.617  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - LEM                      |     0.391  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 00:58:45,474 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |       N/A\n",
      "2023-04-07 00:58:45,475 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 00:58:45,475 - INFO - combo.training.tensorboard_writer - EM                       |     0.957  |       N/A\n",
      "2023-04-07 00:58:45,475 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 00:58:45,479 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 00:58:50,382 - INFO - combo.training.trainer - Epoch duration: 0:01:20.421411\n",
      "2023-04-07 00:58:50,383 - INFO - combo.training.trainer - Estimated training time remaining: 6:54:19\n",
      "2023-04-07 00:58:50,383 - INFO - allennlp.training.trainer - Epoch 95/399\n",
      "2023-04-07 00:58:50,383 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 00:58:50,384 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 00:58:50,393 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9403, LAS: 0.8966, UEM: 0.2033, LEM: 0.0664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7028, partial_loss/deprel_loss: 0.6247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8098, loss: 0.7676, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:   3%|2         | 3/111 [00:02<01:13,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9443, LAS: 0.9015, UEM: 0.2599, LEM: 0.0791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5260, partial_loss/deprel_loss: 0.4491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6339, loss: 0.7219, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:   5%|5         | 6/111 [00:04<01:13,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9452, LAS: 0.9049, UEM: 0.4647, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1432, partial_loss/deprel_loss: 0.2551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4022, loss: 0.6918, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:   8%|8         | 9/111 [00:06<01:11,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9517, LAS: 0.9121, UEM: 0.5362, LEM: 0.3248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2530, partial_loss/deprel_loss: 0.4008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5407, loss: 0.6405, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:  12%|#1        | 13/111 [00:08<01:05,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9501, LAS: 0.9100, UEM: 0.5007, LEM: 0.2911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4803, partial_loss/deprel_loss: 0.4817, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.6529, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:  14%|#4        | 16/111 [00:10<01:03,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9510, LAS: 0.9112, UEM: 0.5359, LEM: 0.3277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3315, partial_loss/deprel_loss: 0.3570, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5214, loss: 0.6384, batch_reg_loss: 0.1695, reg_loss: 0.1695 ||:  17%|#7        | 19/111 [00:13<01:05,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9515, LAS: 0.9117, UEM: 0.5425, LEM: 0.3300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.3072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4491, loss: 0.6385, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||:  21%|##        | 23/111 [00:15<00:59,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9527, LAS: 0.9131, UEM: 0.5493, LEM: 0.3301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4411, partial_loss/deprel_loss: 0.4339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.6308, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||:  23%|##3       | 26/111 [00:17<00:58,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9513, LAS: 0.9119, UEM: 0.5297, LEM: 0.3149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6417, partial_loss/deprel_loss: 0.5229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7161, loss: 0.6360, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||:  26%|##6       | 29/111 [00:19<00:56,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9521, LAS: 0.9128, UEM: 0.5411, LEM: 0.3158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6245, partial_loss/deprel_loss: 0.4886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6852, loss: 0.6294, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||:  29%|##8       | 32/111 [00:22<00:57,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9525, LAS: 0.9133, UEM: 0.5363, LEM: 0.3086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4648, partial_loss/deprel_loss: 0.4901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6544, loss: 0.6274, batch_reg_loss: 0.1694, reg_loss: 0.1695 ||:  32%|###1      | 35/111 [00:24<00:54,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9053, UAS: 0.9525, LAS: 0.9130, UEM: 0.5261, LEM: 0.2956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6211, partial_loss/deprel_loss: 0.5475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7316, loss: 0.6312, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||:  35%|###5      | 39/111 [00:26<00:49,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9537, LAS: 0.9144, UEM: 0.5419, LEM: 0.3059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4597, partial_loss/deprel_loss: 0.4636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6322, loss: 0.6227, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||:  39%|###8      | 43/111 [00:28<00:44,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9520, LAS: 0.9128, UEM: 0.5411, LEM: 0.3107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1825, partial_loss/deprel_loss: 0.3025, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4479, loss: 0.6364, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||:  42%|####2     | 47/111 [00:30<00:38,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9530, LAS: 0.9136, UEM: 0.5572, LEM: 0.3243, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4463, partial_loss/deprel_loss: 0.5523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7004, loss: 0.6296, batch_reg_loss: 0.1694, reg_loss: 0.1694 ||:  46%|####5     | 51/111 [00:33<00:34,  1.71it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9539, LAS: 0.9149, UEM: 0.5827, LEM: 0.3534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6151, partial_loss/deprel_loss: 0.5066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6976, loss: 0.6191, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  50%|#####     | 56/111 [00:35<00:30,  1.80it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9541, LAS: 0.9150, UEM: 0.5864, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2266, partial_loss/deprel_loss: 0.3339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4818, loss: 0.6187, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  54%|#####4    | 60/111 [00:38<00:29,  1.73it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9704, UAS: 0.9552, LAS: 0.9164, UEM: 0.6180, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0377, partial_loss/deprel_loss: 0.1045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2604, loss: 0.6088, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  58%|#####7    | 64/111 [00:41<00:32,  1.45it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9551, LAS: 0.9162, UEM: 0.6103, LEM: 0.3890, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2907, partial_loss/deprel_loss: 0.3677, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5216, loss: 0.6092, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  61%|######1   | 68/111 [00:44<00:28,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9553, LAS: 0.9164, UEM: 0.6085, LEM: 0.3851, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2413, partial_loss/deprel_loss: 0.3382, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.6091, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  65%|######4   | 72/111 [00:46<00:24,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9551, LAS: 0.9161, UEM: 0.6072, LEM: 0.3825, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1896, partial_loss/deprel_loss: 0.3795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5108, loss: 0.6118, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  68%|######8   | 76/111 [00:49<00:22,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8901, UAS: 0.9546, LAS: 0.9153, UEM: 0.6000, LEM: 0.3749, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6490, partial_loss/deprel_loss: 0.6409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8118, loss: 0.6166, batch_reg_loss: 0.1693, reg_loss: 0.1694 ||:  72%|#######2  | 80/111 [00:51<00:20,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9319, UAS: 0.9547, LAS: 0.9156, UEM: 0.5963, LEM: 0.3708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2473, partial_loss/deprel_loss: 0.3526, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5008, loss: 0.6157, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||:  76%|#######5  | 84/111 [00:54<00:18,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9548, LAS: 0.9158, UEM: 0.5937, LEM: 0.3677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2914, partial_loss/deprel_loss: 0.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5093, loss: 0.6155, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||:  79%|#######9  | 88/111 [00:58<00:16,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9547, LAS: 0.9157, UEM: 0.5955, LEM: 0.3694, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2497, partial_loss/deprel_loss: 0.3107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4677, loss: 0.6151, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||:  82%|########1 | 91/111 [01:00<00:14,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9548, LAS: 0.9158, UEM: 0.5948, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6732, partial_loss/deprel_loss: 0.6229, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8022, loss: 0.6142, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||:  86%|########5 | 95/111 [01:02<00:10,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9550, LAS: 0.9159, UEM: 0.5965, LEM: 0.3674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1758, partial_loss/deprel_loss: 0.2661, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4172, loss: 0.6134, batch_reg_loss: 0.1692, reg_loss: 0.1694 ||:  89%|########9 | 99/111 [01:05<00:07,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9549, LAS: 0.9159, UEM: 0.6031, LEM: 0.3734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2254, partial_loss/deprel_loss: 0.3636, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5051, loss: 0.6133, batch_reg_loss: 0.1692, reg_loss: 0.1693 ||:  93%|#########2| 103/111 [01:07<00:05,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9552, LAS: 0.9162, UEM: 0.6069, LEM: 0.3765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2262, partial_loss/deprel_loss: 0.3421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.6110, batch_reg_loss: 0.1692, reg_loss: 0.1693 ||:  96%|#########6| 107/111 [01:09<00:02,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9559, LAS: 0.9168, UEM: 0.6223, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0805, partial_loss/deprel_loss: 0.1551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3094, loss: 0.6056, batch_reg_loss: 0.1692, reg_loss: 0.1693 ||: 100%|##########| 111/111 [01:12<00:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9559, LAS: 0.9168, UEM: 0.6223, LEM: 0.3930, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0805, partial_loss/deprel_loss: 0.1551, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3094, loss: 0.6056, batch_reg_loss: 0.1692, reg_loss: 0.1693 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
      "2023-04-07 01:00:06,571 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8717, UAS: 0.9433, LAS: 0.8922, UEM: 0.5839, LEM: 0.2975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3625, partial_loss/deprel_loss: 45.9887, partial_loss/cycle_loss: 0.0000, batch_loss: 37.0634, loss: 28.0423, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:03<00:10,  1.02s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9475, LAS: 0.8973, UEM: 0.5948, LEM: 0.3034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5580, partial_loss/deprel_loss: 23.4960, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9084, loss: 23.4430, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.01it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8746, UAS: 0.9461, LAS: 0.8943, UEM: 0.5695, LEM: 0.2727, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1060, partial_loss/deprel_loss: 41.4238, partial_loss/cycle_loss: 0.0000, batch_loss: 33.3602, loss: 24.6334, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.02it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9515, LAS: 0.9013, UEM: 0.6730, LEM: 0.4032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1632, partial_loss/deprel_loss: 22.7933, partial_loss/cycle_loss: 0.0000, batch_loss: 18.2673, loss: 23.1488, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.04it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8296, UAS: 0.9464, LAS: 0.8957, UEM: 0.6553, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6588, partial_loss/deprel_loss: 54.3492, partial_loss/cycle_loss: 0.0000, batch_loss: 43.8111, loss: 24.7382, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.02it/s]\n",
      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 01:00:19,335 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.155  |    54.349\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.081  |     1.659\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.169  |     0.000\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - UEM                      |     0.622  |     0.655\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - LAS                      |     0.917  |     0.896\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - loss                     |     0.606  |    24.738\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - LEM                      |     0.393  |     0.392\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - UAS                      |     0.956  |     0.946\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - EM                       |     0.955  |     0.830\n",
      "2023-04-07 01:00:19,336 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:00:19,341 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:00:24,554 - INFO - combo.training.trainer - Epoch duration: 0:01:34.171200\n",
      "2023-04-07 01:00:24,555 - INFO - combo.training.trainer - Estimated training time remaining: 6:53:37\n",
      "2023-04-07 01:00:24,555 - INFO - allennlp.training.trainer - Epoch 96/399\n",
      "2023-04-07 01:00:24,555 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:00:24,555 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:00:24,562 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8935, UAS: 0.9391, LAS: 0.8974, UEM: 0.2827, LEM: 0.1307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7643, partial_loss/deprel_loss: 0.5785, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7848, loss: 0.7524, batch_reg_loss: 0.1692, reg_loss: 0.1692 ||:   4%|3         | 4/111 [00:02<01:00,  1.76it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9463, LAS: 0.9054, UEM: 0.4872, LEM: 0.2904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7313, partial_loss/deprel_loss: 0.5896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7871, loss: 0.6933, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:   8%|8         | 9/111 [00:04<00:56,  1.80it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9499, LAS: 0.9104, UEM: 0.5896, LEM: 0.3841, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1736, partial_loss/deprel_loss: 0.2812, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4288, loss: 0.6497, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  11%|#         | 12/111 [00:07<01:00,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9004, UAS: 0.9503, LAS: 0.9112, UEM: 0.5665, LEM: 0.3555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5769, partial_loss/deprel_loss: 0.5445, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7201, loss: 0.6425, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  14%|#4        | 16/111 [00:09<00:55,  1.72it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9122, UAS: 0.9521, LAS: 0.9129, UEM: 0.5732, LEM: 0.3552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4876, partial_loss/deprel_loss: 0.4542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6300, loss: 0.6335, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  17%|#7        | 19/111 [00:11<00:56,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8980, UAS: 0.9524, LAS: 0.9133, UEM: 0.5812, LEM: 0.3596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7037, partial_loss/deprel_loss: 0.5797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7736, loss: 0.6279, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  21%|##        | 23/111 [00:13<00:54,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9520, LAS: 0.9131, UEM: 0.5641, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2893, partial_loss/deprel_loss: 0.3722, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5247, loss: 0.6309, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  24%|##4       | 27/111 [00:15<00:50,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9101, UAS: 0.9548, LAS: 0.9162, UEM: 0.6015, LEM: 0.3720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3965, partial_loss/deprel_loss: 0.4824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6343, loss: 0.6099, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  29%|##8       | 32/111 [00:18<00:43,  1.82it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9012, UAS: 0.9558, LAS: 0.9175, UEM: 0.6238, LEM: 0.3993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7691, partial_loss/deprel_loss: 0.5358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7515, loss: 0.6023, batch_reg_loss: 0.1691, reg_loss: 0.1691 ||:  33%|###3      | 37/111 [00:20<00:40,  1.84it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9561, LAS: 0.9177, UEM: 0.6109, LEM: 0.3852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2981, partial_loss/deprel_loss: 0.4184, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5634, loss: 0.6028, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  37%|###6      | 41/111 [00:23<00:39,  1.75it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9546, LAS: 0.9165, UEM: 0.6138, LEM: 0.3904, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2492, partial_loss/deprel_loss: 0.3801, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5230, loss: 0.6106, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  41%|####      | 45/111 [00:26<00:42,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9550, LAS: 0.9170, UEM: 0.6111, LEM: 0.3871, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6034, partial_loss/deprel_loss: 0.4635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6605, loss: 0.6057, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  44%|####4     | 49/111 [00:29<00:39,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9554, LAS: 0.9174, UEM: 0.6144, LEM: 0.3896, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4303, partial_loss/deprel_loss: 0.4575, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6211, loss: 0.6032, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  48%|####7     | 53/111 [00:31<00:37,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8986, UAS: 0.9550, LAS: 0.9167, UEM: 0.6106, LEM: 0.3844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6086, partial_loss/deprel_loss: 0.5597, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7385, loss: 0.6088, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  51%|#####1    | 57/111 [00:34<00:35,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9007, UAS: 0.9552, LAS: 0.9167, UEM: 0.6143, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4830, partial_loss/deprel_loss: 0.5003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6658, loss: 0.6087, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  55%|#####4    | 61/111 [00:37<00:33,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9551, LAS: 0.9167, UEM: 0.6094, LEM: 0.3821, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4728, partial_loss/deprel_loss: 0.3934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5782, loss: 0.6072, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  59%|#####8    | 65/111 [00:39<00:29,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9551, LAS: 0.9168, UEM: 0.6119, LEM: 0.3843, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1561, partial_loss/deprel_loss: 0.2667, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4136, loss: 0.6057, batch_reg_loss: 0.1690, reg_loss: 0.1691 ||:  62%|######2   | 69/111 [00:42<00:26,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9236, UAS: 0.9551, LAS: 0.9169, UEM: 0.6096, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3390, partial_loss/deprel_loss: 0.3907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5493, loss: 0.6053, batch_reg_loss: 0.1689, reg_loss: 0.1691 ||:  66%|######5   | 73/111 [00:44<00:24,  1.54it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9560, LAS: 0.9179, UEM: 0.6290, LEM: 0.4057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2955, partial_loss/deprel_loss: 0.3446, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5037, loss: 0.5985, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  69%|######9   | 77/111 [00:47<00:23,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9036, UAS: 0.9564, LAS: 0.9185, UEM: 0.6391, LEM: 0.4171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5531, partial_loss/deprel_loss: 0.4909, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6723, loss: 0.5941, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  72%|#######2  | 80/111 [00:50<00:21,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9565, LAS: 0.9185, UEM: 0.6354, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3544, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5767, loss: 0.5948, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  76%|#######5  | 84/111 [00:52<00:17,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9563, LAS: 0.9183, UEM: 0.6299, LEM: 0.4058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2253, partial_loss/deprel_loss: 0.3211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4708, loss: 0.5979, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  79%|#######9  | 88/111 [00:55<00:15,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9556, LAS: 0.9175, UEM: 0.6254, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5456, partial_loss/deprel_loss: 0.4963, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6750, loss: 0.6032, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  83%|########2 | 92/111 [00:58<00:13,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9555, LAS: 0.9173, UEM: 0.6257, LEM: 0.4025, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5814, partial_loss/deprel_loss: 0.5300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7091, loss: 0.6043, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  86%|########6 | 96/111 [01:00<00:09,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9556, LAS: 0.9175, UEM: 0.6248, LEM: 0.4004, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1825, partial_loss/deprel_loss: 0.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4346, loss: 0.6037, batch_reg_loss: 0.1689, reg_loss: 0.1690 ||:  90%|######### | 100/111 [01:03<00:07,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8807, UAS: 0.9557, LAS: 0.9176, UEM: 0.6292, LEM: 0.4046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9167, partial_loss/deprel_loss: 0.6152, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8444, loss: 0.6018, batch_reg_loss: 0.1688, reg_loss: 0.1690 ||:  94%|#########3| 104/111 [01:06<00:04,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9550, LAS: 0.9170, UEM: 0.6240, LEM: 0.4016, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.3029, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4594, loss: 0.6050, batch_reg_loss: 0.1688, reg_loss: 0.1690 ||:  97%|#########7| 108/111 [01:08<00:02,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9550, LAS: 0.9168, UEM: 0.6213, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2427, partial_loss/deprel_loss: 0.4258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5580, loss: 0.6063, batch_reg_loss: 0.1688, reg_loss: 0.1690 ||: 100%|##########| 111/111 [01:10<00:00,  1.57it/s]\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.426  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.243  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.169  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - UEM                      |     0.621  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - LAS                      |     0.917  |       N/A\n",
      "2023-04-07 01:01:38,118 - INFO - combo.training.tensorboard_writer - loss                     |     0.606  |       N/A\n",
      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - LEM                      |     0.397  |       N/A\n",
      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - UAS                      |     0.955  |       N/A\n",
      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - EM                       |     0.920  |       N/A\n",
      "2023-04-07 01:01:38,119 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:01:38,123 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:01:41,735 - INFO - combo.training.trainer - Epoch duration: 0:01:17.180312\n",
      "2023-04-07 01:01:41,736 - INFO - combo.training.trainer - Estimated training time remaining: 6:52:02\n",
      "2023-04-07 01:01:41,736 - INFO - allennlp.training.trainer - Epoch 97/399\n",
      "2023-04-07 01:01:41,736 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:01:41,737 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:01:41,751 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9212, UAS: 0.9528, LAS: 0.9152, UEM: 0.4238, LEM: 0.1726, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.4121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5561, loss: 0.6364, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||:   4%|3         | 4/111 [00:02<01:05,  1.63it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9571, LAS: 0.9196, UEM: 0.4810, LEM: 0.2370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3336, partial_loss/deprel_loss: 0.3597, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5233, loss: 0.5891, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||:   7%|7         | 8/111 [00:04<01:00,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9574, LAS: 0.9207, UEM: 0.5548, LEM: 0.3183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2063, partial_loss/deprel_loss: 0.2908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4427, loss: 0.5791, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||:  12%|#1        | 13/111 [00:06<00:54,  1.81it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9551, LAS: 0.9179, UEM: 0.5253, LEM: 0.2913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4222, partial_loss/deprel_loss: 0.4357, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6018, loss: 0.6009, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||:  16%|#6        | 18/111 [00:09<00:48,  1.91it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9556, LAS: 0.9183, UEM: 0.5201, LEM: 0.2861, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5889, partial_loss/deprel_loss: 0.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.5964, batch_reg_loss: 0.1688, reg_loss: 0.1688 ||:  21%|##        | 23/111 [00:11<00:44,  1.99it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8937, UAS: 0.9550, LAS: 0.9174, UEM: 0.5125, LEM: 0.2803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6726, partial_loss/deprel_loss: 0.5126, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7134, loss: 0.5991, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  24%|##4       | 27/111 [00:14<00:45,  1.83it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9525, LAS: 0.9149, UEM: 0.5015, LEM: 0.2737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8222, partial_loss/deprel_loss: 0.5603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7814, loss: 0.6175, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  28%|##7       | 31/111 [00:16<00:46,  1.71it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9539, LAS: 0.9157, UEM: 0.5416, LEM: 0.3111, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2850, partial_loss/deprel_loss: 0.3523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5076, loss: 0.6092, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  32%|###1      | 35/111 [00:19<00:47,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9371, UAS: 0.9550, LAS: 0.9171, UEM: 0.5771, LEM: 0.3557, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1882, partial_loss/deprel_loss: 0.3070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4520, loss: 0.5997, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  35%|###5      | 39/111 [00:22<00:47,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8661, UAS: 0.9541, LAS: 0.9158, UEM: 0.5798, LEM: 0.3571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0605, partial_loss/deprel_loss: 0.7466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9781, loss: 0.6078, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  39%|###8      | 43/111 [00:25<00:47,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9136, UAS: 0.9541, LAS: 0.9158, UEM: 0.5736, LEM: 0.3501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5492, partial_loss/deprel_loss: 0.4876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6686, loss: 0.6089, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  42%|####2     | 47/111 [00:28<00:43,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9544, LAS: 0.9162, UEM: 0.5777, LEM: 0.3527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4814, partial_loss/deprel_loss: 0.5070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6706, loss: 0.6079, batch_reg_loss: 0.1687, reg_loss: 0.1688 ||:  45%|####5     | 50/111 [00:30<00:42,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9539, LAS: 0.9156, UEM: 0.5682, LEM: 0.3432, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3379, partial_loss/deprel_loss: 0.4453, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5925, loss: 0.6127, batch_reg_loss: 0.1687, reg_loss: 0.1687 ||:  49%|####8     | 54/111 [00:32<00:38,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9547, LAS: 0.9161, UEM: 0.5806, LEM: 0.3531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4688, partial_loss/deprel_loss: 0.5378, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6927, loss: 0.6084, batch_reg_loss: 0.1687, reg_loss: 0.1687 ||:  52%|#####2    | 58/111 [00:35<00:35,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9558, LAS: 0.9174, UEM: 0.6119, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3170, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4793, loss: 0.5991, batch_reg_loss: 0.1687, reg_loss: 0.1687 ||:  56%|#####5    | 62/111 [00:39<00:36,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9561, LAS: 0.9176, UEM: 0.6116, LEM: 0.3917, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4259, partial_loss/deprel_loss: 0.5426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6879, loss: 0.5979, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  59%|#####8    | 65/111 [00:41<00:34,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9558, LAS: 0.9175, UEM: 0.6148, LEM: 0.3955, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4009, partial_loss/deprel_loss: 0.4690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6240, loss: 0.5995, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  61%|######1   | 68/111 [00:43<00:32,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9559, LAS: 0.9177, UEM: 0.6136, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1631, partial_loss/deprel_loss: 0.2949, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4371, loss: 0.5977, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  64%|######3   | 71/111 [00:45<00:30,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9551, LAS: 0.9166, UEM: 0.6049, LEM: 0.3879, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4649, partial_loss/deprel_loss: 0.4780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6440, loss: 0.6042, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  67%|######6   | 74/111 [00:47<00:26,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9020, UAS: 0.9549, LAS: 0.9165, UEM: 0.6025, LEM: 0.3856, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6400, partial_loss/deprel_loss: 0.5306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7211, loss: 0.6049, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  70%|#######   | 78/111 [00:50<00:23,  1.40it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9559, LAS: 0.9177, UEM: 0.6219, LEM: 0.4045, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1427, partial_loss/deprel_loss: 0.2165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3704, loss: 0.5963, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  74%|#######3  | 82/111 [00:53<00:19,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9562, LAS: 0.9179, UEM: 0.6242, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5192, partial_loss/deprel_loss: 0.5186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6873, loss: 0.5945, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  77%|#######6  | 85/111 [00:55<00:17,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9153, UAS: 0.9559, LAS: 0.9177, UEM: 0.6176, LEM: 0.3978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4235, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5915, loss: 0.5972, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  80%|########  | 89/111 [00:57<00:14,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9562, LAS: 0.9180, UEM: 0.6208, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1388, partial_loss/deprel_loss: 0.2387, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3873, loss: 0.5943, batch_reg_loss: 0.1686, reg_loss: 0.1687 ||:  84%|########3 | 93/111 [01:00<00:11,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8943, UAS: 0.9562, LAS: 0.9179, UEM: 0.6276, LEM: 0.4098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8061, partial_loss/deprel_loss: 0.5951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8058, loss: 0.5943, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||:  87%|########7 | 97/111 [01:03<00:09,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9561, LAS: 0.9178, UEM: 0.6256, LEM: 0.4068, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2770, partial_loss/deprel_loss: 0.3365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4931, loss: 0.5947, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||:  91%|######### | 101/111 [01:06<00:06,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9560, LAS: 0.9177, UEM: 0.6224, LEM: 0.4029, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3510, partial_loss/deprel_loss: 0.3745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5384, loss: 0.5959, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||:  94%|#########3| 104/111 [01:08<00:04,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9560, LAS: 0.9176, UEM: 0.6200, LEM: 0.3996, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3526, partial_loss/deprel_loss: 0.3979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5573, loss: 0.5966, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||:  96%|#########6| 107/111 [01:10<00:02,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9562, LAS: 0.9178, UEM: 0.6249, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1825, partial_loss/deprel_loss: 0.2514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4061, loss: 0.5948, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||:  99%|#########9| 110/111 [01:12<00:00,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9563, LAS: 0.9179, UEM: 0.6249, LEM: 0.4038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2849, partial_loss/deprel_loss: 0.3783, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5281, loss: 0.5942, batch_reg_loss: 0.1685, reg_loss: 0.1687 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "2023-04-07 01:02:57,808 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.378  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.285  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.169  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - UEM                      |     0.625  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - LAS                      |     0.918  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - loss                     |     0.594  |       N/A\n",
      "2023-04-07 01:02:57,809 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - LEM                      |     0.404  |       N/A\n",
      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - UAS                      |     0.956  |       N/A\n",
      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - EM                       |     0.929  |       N/A\n",
      "2023-04-07 01:02:57,810 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:02:57,814 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:03:02,067 - INFO - combo.training.trainer - Epoch duration: 0:01:20.331514\n",
      "2023-04-07 01:03:02,068 - INFO - combo.training.trainer - Estimated training time remaining: 6:50:36\n",
      "2023-04-07 01:03:02,068 - INFO - allennlp.training.trainer - Epoch 98/399\n",
      "2023-04-07 01:03:02,068 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:03:02,069 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:03:02,078 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9541, LAS: 0.9186, UEM: 0.5242, LEM: 0.3288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5159, partial_loss/deprel_loss: 0.5113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6807, loss: 0.6171, batch_reg_loss: 0.1685, reg_loss: 0.1685 ||:   5%|4         | 5/111 [00:02<00:44,  2.36it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9596, UAS: 0.9624, LAS: 0.9276, UEM: 0.7138, LEM: 0.5187, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0722, partial_loss/deprel_loss: 0.1715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3201, loss: 0.5430, batch_reg_loss: 0.1685, reg_loss: 0.1685 ||:   8%|8         | 9/111 [00:04<00:45,  2.23it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9602, LAS: 0.9251, UEM: 0.6759, LEM: 0.4770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2314, partial_loss/deprel_loss: 0.3308, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4794, loss: 0.5607, batch_reg_loss: 0.1685, reg_loss: 0.1685 ||:  12%|#1        | 13/111 [00:06<00:47,  2.05it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9616, LAS: 0.9257, UEM: 0.6847, LEM: 0.4680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1678, partial_loss/deprel_loss: 0.2828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4282, loss: 0.5542, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||:  14%|#4        | 16/111 [00:08<00:56,  1.69it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9788, UAS: 0.9625, LAS: 0.9276, UEM: 0.7210, LEM: 0.5319, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0258, partial_loss/deprel_loss: 0.0861, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2424, loss: 0.5429, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||:  17%|#7        | 19/111 [00:11<01:02,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9600, LAS: 0.9245, UEM: 0.6866, LEM: 0.4975, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7137, partial_loss/deprel_loss: 0.5098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7190, loss: 0.5636, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||:  21%|##        | 23/111 [00:14<00:59,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9593, LAS: 0.9240, UEM: 0.6749, LEM: 0.4812, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2493, partial_loss/deprel_loss: 0.3284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4810, loss: 0.5654, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||:  23%|##3       | 26/111 [00:16<00:57,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9578, LAS: 0.9217, UEM: 0.6691, LEM: 0.4742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5636, partial_loss/deprel_loss: 0.5041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6844, loss: 0.5787, batch_reg_loss: 0.1684, reg_loss: 0.1685 ||:  27%|##7       | 30/111 [00:18<00:53,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9563, LAS: 0.9197, UEM: 0.6634, LEM: 0.4649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8823, partial_loss/deprel_loss: 0.6261, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8457, loss: 0.5912, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||:  31%|###       | 34/111 [00:21<00:50,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8895, UAS: 0.9540, LAS: 0.9172, UEM: 0.6384, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7668, partial_loss/deprel_loss: 0.6458, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8384, loss: 0.6081, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||:  34%|###4      | 38/111 [00:23<00:47,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9545, LAS: 0.9177, UEM: 0.6341, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6419, partial_loss/deprel_loss: 0.4970, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6943, loss: 0.6035, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||:  38%|###7      | 42/111 [00:26<00:44,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9048, UAS: 0.9552, LAS: 0.9182, UEM: 0.6314, LEM: 0.4292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5426, partial_loss/deprel_loss: 0.5139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6880, loss: 0.5989, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||:  41%|####1     | 46/111 [00:29<00:42,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9548, LAS: 0.9177, UEM: 0.6174, LEM: 0.4134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2994, partial_loss/deprel_loss: 0.4110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5570, loss: 0.6036, batch_reg_loss: 0.1684, reg_loss: 0.1684 ||:  45%|####5     | 50/111 [00:31<00:40,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9551, LAS: 0.9179, UEM: 0.6165, LEM: 0.4088, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3775, partial_loss/deprel_loss: 0.3967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5612, loss: 0.6012, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  48%|####7     | 53/111 [00:33<00:38,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9557, LAS: 0.9184, UEM: 0.6215, LEM: 0.4096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2372, partial_loss/deprel_loss: 0.3011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4567, loss: 0.5959, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  50%|#####     | 56/111 [00:35<00:36,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9561, LAS: 0.9188, UEM: 0.6278, LEM: 0.4150, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2137, partial_loss/deprel_loss: 0.2977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4492, loss: 0.5927, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  53%|#####3    | 59/111 [00:38<00:36,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9563, LAS: 0.9188, UEM: 0.6229, LEM: 0.4084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3157, partial_loss/deprel_loss: 0.3908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5441, loss: 0.5923, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  56%|#####5    | 62/111 [00:40<00:34,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9559, LAS: 0.9182, UEM: 0.6228, LEM: 0.4062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2031, partial_loss/deprel_loss: 0.3757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5095, loss: 0.5966, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  59%|#####8    | 65/111 [00:42<00:32,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9560, LAS: 0.9184, UEM: 0.6212, LEM: 0.4057, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1784, partial_loss/deprel_loss: 0.2485, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4028, loss: 0.5939, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  62%|######2   | 69/111 [00:45<00:29,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9566, LAS: 0.9191, UEM: 0.6341, LEM: 0.4180, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1107, partial_loss/deprel_loss: 0.2521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3921, loss: 0.5892, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  65%|######4   | 72/111 [00:47<00:28,  1.35it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9188, UAS: 0.9566, LAS: 0.9189, UEM: 0.6289, LEM: 0.4104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.4228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5807, loss: 0.5898, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  68%|######8   | 76/111 [00:50<00:24,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9571, LAS: 0.9195, UEM: 0.6385, LEM: 0.4207, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2057, partial_loss/deprel_loss: 0.3700, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5054, loss: 0.5858, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  71%|#######1  | 79/111 [00:52<00:22,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9571, LAS: 0.9194, UEM: 0.6355, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3003, partial_loss/deprel_loss: 0.4440, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5835, loss: 0.5865, batch_reg_loss: 0.1683, reg_loss: 0.1684 ||:  74%|#######3  | 82/111 [00:54<00:21,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9572, LAS: 0.9194, UEM: 0.6377, LEM: 0.4172, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2213, partial_loss/deprel_loss: 0.3443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4880, loss: 0.5859, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||:  77%|#######6  | 85/111 [00:57<00:19,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8670, UAS: 0.9567, LAS: 0.9189, UEM: 0.6401, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1453, partial_loss/deprel_loss: 0.6996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9569, loss: 0.5903, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||:  79%|#######9  | 88/111 [00:59<00:17,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9568, LAS: 0.9189, UEM: 0.6360, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4078, partial_loss/deprel_loss: 0.4475, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6078, loss: 0.5904, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||:  82%|########1 | 91/111 [01:01<00:14,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9564, LAS: 0.9184, UEM: 0.6309, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6180, partial_loss/deprel_loss: 0.5235, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7107, loss: 0.5933, batch_reg_loss: 0.1682, reg_loss: 0.1684 ||:  86%|########5 | 95/111 [01:03<00:11,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9045, UAS: 0.9568, LAS: 0.9188, UEM: 0.6325, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6260, partial_loss/deprel_loss: 0.5665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7466, loss: 0.5919, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||:  89%|########9 | 99/111 [01:06<00:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9567, LAS: 0.9188, UEM: 0.6271, LEM: 0.4056, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4285, partial_loss/deprel_loss: 0.4146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5855, loss: 0.5936, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||:  93%|#########2| 103/111 [01:08<00:05,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9573, LAS: 0.9193, UEM: 0.6311, LEM: 0.4069, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1397, partial_loss/deprel_loss: 0.2701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4122, loss: 0.5898, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||:  96%|#########6| 107/111 [01:10<00:02,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9572, LAS: 0.9193, UEM: 0.6285, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3200, partial_loss/deprel_loss: 0.4264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5733, loss: 0.5914, batch_reg_loss: 0.1682, reg_loss: 0.1683 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.426  |       N/A\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.320  |       N/A\n",
      "2023-04-07 01:04:18,230 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.168  |       N/A\n",
      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - UEM                      |     0.628  |       N/A\n",
      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - LAS                      |     0.919  |       N/A\n",
      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - loss                     |     0.591  |       N/A\n",
      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - LEM                      |     0.404  |       N/A\n",
      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - UAS                      |     0.957  |       N/A\n",
      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - EM                       |     0.927  |       N/A\n",
      "2023-04-07 01:04:18,231 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:04:18,236 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:04:23,599 - INFO - combo.training.trainer - Epoch duration: 0:01:21.530588\n",
      "2023-04-07 01:04:23,599 - INFO - combo.training.trainer - Estimated training time remaining: 6:49:15\n",
      "2023-04-07 01:04:23,599 - INFO - allennlp.training.trainer - Epoch 99/399\n",
      "2023-04-07 01:04:23,600 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:04:23,600 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:04:23,610 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9617, LAS: 0.9249, UEM: 0.5893, LEM: 0.3322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4106, partial_loss/deprel_loss: 0.4330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5967, loss: 0.5332, batch_reg_loss: 0.1681, reg_loss: 0.1682 ||:   4%|3         | 4/111 [00:02<01:07,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9595, LAS: 0.9213, UEM: 0.6843, LEM: 0.4378, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.2754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4223, loss: 0.5445, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:   6%|6         | 7/111 [00:05<01:13,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9636, LAS: 0.9278, UEM: 0.7559, LEM: 0.5669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4117, partial_loss/deprel_loss: 0.4424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.5165, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:   9%|9         | 10/111 [00:07<01:14,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9228, UAS: 0.9641, LAS: 0.9285, UEM: 0.7408, LEM: 0.5375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3300, partial_loss/deprel_loss: 0.3917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5475, loss: 0.5127, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  12%|#1        | 13/111 [00:09<01:13,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8964, UAS: 0.9580, LAS: 0.9216, UEM: 0.7034, LEM: 0.4986, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6043, partial_loss/deprel_loss: 0.5621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7386, loss: 0.5675, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  15%|#5        | 17/111 [00:12<01:08,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8995, UAS: 0.9556, LAS: 0.9192, UEM: 0.6625, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7397, partial_loss/deprel_loss: 0.5515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7573, loss: 0.5879, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  19%|#8        | 21/111 [00:15<01:02,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9563, LAS: 0.9201, UEM: 0.6492, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2487, partial_loss/deprel_loss: 0.3765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5190, loss: 0.5868, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  23%|##2       | 25/111 [00:17<00:57,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9579, LAS: 0.9217, UEM: 0.6643, LEM: 0.4489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1325, partial_loss/deprel_loss: 0.2781, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4171, loss: 0.5753, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  26%|##6       | 29/111 [00:19<00:53,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9570, LAS: 0.9207, UEM: 0.6437, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3022, partial_loss/deprel_loss: 0.4089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5556, loss: 0.5883, batch_reg_loss: 0.1681, reg_loss: 0.1681 ||:  30%|##9       | 33/111 [00:22<00:51,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9567, LAS: 0.9202, UEM: 0.6330, LEM: 0.4166, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6738, partial_loss/deprel_loss: 0.5017, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7042, loss: 0.5906, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  33%|###3      | 37/111 [00:25<00:48,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9351, UAS: 0.9578, LAS: 0.9212, UEM: 0.6431, LEM: 0.4213, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2221, partial_loss/deprel_loss: 0.3180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4669, loss: 0.5836, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  36%|###6      | 40/111 [00:27<00:48,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9584, LAS: 0.9217, UEM: 0.6527, LEM: 0.4313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1170, partial_loss/deprel_loss: 0.2165, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3646, loss: 0.5801, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  39%|###8      | 43/111 [00:29<00:46,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9586, LAS: 0.9219, UEM: 0.6642, LEM: 0.4476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6093, partial_loss/deprel_loss: 0.5565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7350, loss: 0.5771, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  41%|####1     | 46/111 [00:32<00:47,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9250, UAS: 0.9580, LAS: 0.9211, UEM: 0.6541, LEM: 0.4386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3014, partial_loss/deprel_loss: 0.3756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5288, loss: 0.5832, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  45%|####5     | 50/111 [00:34<00:42,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9034, UAS: 0.9584, LAS: 0.9217, UEM: 0.6583, LEM: 0.4435, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6870, partial_loss/deprel_loss: 0.4964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7025, loss: 0.5790, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  49%|####8     | 54/111 [00:37<00:39,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9592, LAS: 0.9225, UEM: 0.6651, LEM: 0.4454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1660, partial_loss/deprel_loss: 0.2901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4333, loss: 0.5727, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  52%|#####2    | 58/111 [00:39<00:34,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9592, LAS: 0.9223, UEM: 0.6643, LEM: 0.4408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1708, partial_loss/deprel_loss: 0.3220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4597, loss: 0.5735, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  56%|#####5    | 62/111 [00:42<00:33,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9582, LAS: 0.9212, UEM: 0.6523, LEM: 0.4309, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7255, partial_loss/deprel_loss: 0.4816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6983, loss: 0.5811, batch_reg_loss: 0.1680, reg_loss: 0.1681 ||:  59%|#####9    | 66/111 [00:44<00:29,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9577, LAS: 0.9206, UEM: 0.6417, LEM: 0.4212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5670, partial_loss/deprel_loss: 0.5030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6838, loss: 0.5851, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  63%|######3   | 70/111 [00:47<00:26,  1.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9571, LAS: 0.9201, UEM: 0.6357, LEM: 0.4142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5721, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6575, loss: 0.5889, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  67%|######6   | 74/111 [00:50<00:25,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9568, LAS: 0.9196, UEM: 0.6329, LEM: 0.4119, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2059, partial_loss/deprel_loss: 0.3338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4761, loss: 0.5904, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  69%|######9   | 77/111 [00:53<00:25,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9567, LAS: 0.9194, UEM: 0.6282, LEM: 0.4061, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4504, partial_loss/deprel_loss: 0.4251, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5981, loss: 0.5918, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  72%|#######2  | 80/111 [00:55<00:22,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9568, LAS: 0.9194, UEM: 0.6270, LEM: 0.4034, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2898, partial_loss/deprel_loss: 0.4051, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5499, loss: 0.5915, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  75%|#######4  | 83/111 [00:57<00:20,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9567, LAS: 0.9193, UEM: 0.6383, LEM: 0.4165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1086, partial_loss/deprel_loss: 0.2315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3748, loss: 0.5910, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  77%|#######7  | 86/111 [00:59<00:19,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9568, LAS: 0.9194, UEM: 0.6343, LEM: 0.4114, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.3856, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5293, loss: 0.5909, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  81%|########1 | 90/111 [01:02<00:14,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9573, LAS: 0.9200, UEM: 0.6318, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3063, partial_loss/deprel_loss: 0.3247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4889, loss: 0.5869, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  86%|########5 | 95/111 [01:04<00:10,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9572, LAS: 0.9199, UEM: 0.6300, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2153, partial_loss/deprel_loss: 0.3539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4941, loss: 0.5871, batch_reg_loss: 0.1679, reg_loss: 0.1680 ||:  90%|######### | 100/111 [01:06<00:06,  1.74it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9572, LAS: 0.9199, UEM: 0.6342, LEM: 0.4089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1752, partial_loss/deprel_loss: 0.2231, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3814, loss: 0.5868, batch_reg_loss: 0.1678, reg_loss: 0.1680 ||:  95%|#########4| 105/111 [01:09<00:03,  1.78it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9574, LAS: 0.9199, UEM: 0.6347, LEM: 0.4082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1745, partial_loss/deprel_loss: 0.3159, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4555, loss: 0.5861, batch_reg_loss: 0.1678, reg_loss: 0.1680 ||:  98%|#########8| 109/111 [01:12<00:01,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9573, LAS: 0.9198, UEM: 0.6335, LEM: 0.4064, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2176, partial_loss/deprel_loss: 0.3469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4889, loss: 0.5870, batch_reg_loss: 0.1678, reg_loss: 0.1680 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "2023-04-07 01:05:40,141 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.347  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.218  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.168  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - UEM                      |     0.633  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - LAS                      |     0.920  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - loss                     |     0.587  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - LEM                      |     0.406  |       N/A\n",
      "2023-04-07 01:05:40,142 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - UAS                      |     0.957  |       N/A\n",
      "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - EM                       |     0.935  |       N/A\n",
      "2023-04-07 01:05:40,143 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:05:40,148 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:05:45,118 - INFO - combo.training.trainer - Epoch duration: 0:01:21.518221\n",
      "2023-04-07 01:05:45,118 - INFO - combo.training.trainer - Estimated training time remaining: 6:47:53\n",
      "2023-04-07 01:05:45,118 - INFO - allennlp.training.trainer - Epoch 100/399\n",
      "2023-04-07 01:05:45,119 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:05:45,119 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:05:45,132 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9520, LAS: 0.9132, UEM: 0.6094, LEM: 0.3990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6790, partial_loss/deprel_loss: 0.5050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7076, loss: 0.6213, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||:   4%|3         | 4/111 [00:02<01:06,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9586, LAS: 0.9210, UEM: 0.6494, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4590, partial_loss/deprel_loss: 0.4715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6368, loss: 0.5710, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||:   6%|6         | 7/111 [00:05<01:11,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9576, LAS: 0.9206, UEM: 0.5918, LEM: 0.3678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4997, partial_loss/deprel_loss: 0.4244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6072, loss: 0.5797, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||:  10%|9         | 11/111 [00:07<01:06,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9606, LAS: 0.9235, UEM: 0.6388, LEM: 0.3973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2654, partial_loss/deprel_loss: 0.3501, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5009, loss: 0.5600, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||:  13%|#2        | 14/111 [00:09<01:05,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9619, LAS: 0.9246, UEM: 0.6601, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2255, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5238, loss: 0.5466, batch_reg_loss: 0.1678, reg_loss: 0.1678 ||:  15%|#5        | 17/111 [00:11<01:04,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9631, LAS: 0.9255, UEM: 0.6556, LEM: 0.4027, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2328, partial_loss/deprel_loss: 0.3960, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5311, loss: 0.5455, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||:  19%|#8        | 21/111 [00:14<00:59,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9095, UAS: 0.9625, LAS: 0.9246, UEM: 0.6400, LEM: 0.3836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4028, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.5531, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||:  23%|##2       | 25/111 [00:16<00:56,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9613, LAS: 0.9235, UEM: 0.6279, LEM: 0.3736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2863, partial_loss/deprel_loss: 0.4400, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5770, loss: 0.5629, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||:  26%|##6       | 29/111 [00:19<00:52,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9605, LAS: 0.9226, UEM: 0.6154, LEM: 0.3619, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2613, partial_loss/deprel_loss: 0.3544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5035, loss: 0.5694, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||:  30%|##9       | 33/111 [00:21<00:50,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8827, UAS: 0.9584, LAS: 0.9204, UEM: 0.5967, LEM: 0.3468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0388, partial_loss/deprel_loss: 0.6088, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8625, loss: 0.5841, batch_reg_loss: 0.1677, reg_loss: 0.1678 ||:  33%|###3      | 37/111 [00:24<00:47,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9586, LAS: 0.9211, UEM: 0.6047, LEM: 0.3567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3691, partial_loss/deprel_loss: 0.3959, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5582, loss: 0.5811, batch_reg_loss: 0.1677, reg_loss: 0.1677 ||:  37%|###6      | 41/111 [00:26<00:44,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9586, LAS: 0.9207, UEM: 0.6054, LEM: 0.3582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2843, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4260, loss: 0.5829, batch_reg_loss: 0.1677, reg_loss: 0.1677 ||:  41%|####      | 45/111 [00:29<00:41,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9592, LAS: 0.9213, UEM: 0.6040, LEM: 0.3553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2283, partial_loss/deprel_loss: 0.3198, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4692, loss: 0.5803, batch_reg_loss: 0.1677, reg_loss: 0.1677 ||:  44%|####4     | 49/111 [00:31<00:38,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9581, LAS: 0.9202, UEM: 0.5987, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2588, partial_loss/deprel_loss: 0.3593, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5069, loss: 0.5898, batch_reg_loss: 0.1677, reg_loss: 0.1677 ||:  48%|####7     | 53/111 [00:34<00:36,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9587, LAS: 0.9208, UEM: 0.6148, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2090, partial_loss/deprel_loss: 0.3186, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4643, loss: 0.5836, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  51%|#####1    | 57/111 [00:36<00:33,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9587, LAS: 0.9209, UEM: 0.6090, LEM: 0.3644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5263, partial_loss/deprel_loss: 0.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6407, loss: 0.5827, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  55%|#####4    | 61/111 [00:39<00:30,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9588, LAS: 0.9210, UEM: 0.6164, LEM: 0.3774, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2336, partial_loss/deprel_loss: 0.3478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4926, loss: 0.5814, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  59%|#####8    | 65/111 [00:42<00:30,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9596, LAS: 0.9221, UEM: 0.6403, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1878, partial_loss/deprel_loss: 0.2835, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4319, loss: 0.5750, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  62%|######2   | 69/111 [00:45<00:31,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9595, LAS: 0.9220, UEM: 0.6402, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5404, partial_loss/deprel_loss: 0.5082, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6823, loss: 0.5753, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  65%|######4   | 72/111 [00:47<00:28,  1.36it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9578, LAS: 0.9204, UEM: 0.6296, LEM: 0.4033, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5869, partial_loss/deprel_loss: 0.5256, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7055, loss: 0.5868, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  68%|######8   | 76/111 [00:50<00:23,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9583, LAS: 0.9208, UEM: 0.6404, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1843, partial_loss/deprel_loss: 0.3322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4702, loss: 0.5836, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  72%|#######2  | 80/111 [00:52<00:20,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9581, LAS: 0.9206, UEM: 0.6366, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3103, partial_loss/deprel_loss: 0.3814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5347, loss: 0.5845, batch_reg_loss: 0.1676, reg_loss: 0.1677 ||:  76%|#######5  | 84/111 [00:54<00:16,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8953, UAS: 0.9580, LAS: 0.9205, UEM: 0.6320, LEM: 0.4065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7726, partial_loss/deprel_loss: 0.5384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7528, loss: 0.5854, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||:  79%|#######9  | 88/111 [00:59<00:18,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9584, LAS: 0.9209, UEM: 0.6349, LEM: 0.4081, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4949, partial_loss/deprel_loss: 0.5901, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7386, loss: 0.5834, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||:  83%|########2 | 92/111 [01:01<00:13,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9585, LAS: 0.9210, UEM: 0.6396, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1842, partial_loss/deprel_loss: 0.3661, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.5819, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||:  86%|########6 | 96/111 [01:03<00:10,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9583, LAS: 0.9208, UEM: 0.6358, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4180, partial_loss/deprel_loss: 0.4352, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5993, loss: 0.5829, batch_reg_loss: 0.1675, reg_loss: 0.1677 ||:  91%|######### | 101/111 [01:06<00:06,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9464, UAS: 0.9589, LAS: 0.9215, UEM: 0.6489, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1436, partial_loss/deprel_loss: 0.2605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4046, loss: 0.5776, batch_reg_loss: 0.1675, reg_loss: 0.1676 ||:  95%|#########4| 105/111 [01:08<00:03,  1.73it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9582, LAS: 0.9207, UEM: 0.6415, LEM: 0.4139, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4188, partial_loss/deprel_loss: 0.4373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6011, loss: 0.5831, batch_reg_loss: 0.1675, reg_loss: 0.1676 ||:  98%|#########8| 109/111 [01:10<00:01,  1.74it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9578, LAS: 0.9203, UEM: 0.6389, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3320, partial_loss/deprel_loss: 0.4104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5622, loss: 0.5859, batch_reg_loss: 0.1675, reg_loss: 0.1676 ||: 100%|##########| 111/111 [01:11<00:00,  1.55it/s]\n",
      "2023-04-07 01:07:00,073 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9546, LAS: 0.9047, UEM: 0.6395, LEM: 0.3262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4405, partial_loss/deprel_loss: 24.0473, partial_loss/cycle_loss: 0.0000, batch_loss: 19.3259, loss: 22.2299, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.10it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8763, UAS: 0.9455, LAS: 0.8921, UEM: 0.5202, LEM: 0.2292, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9855, partial_loss/deprel_loss: 35.7936, partial_loss/cycle_loss: 0.0000, batch_loss: 28.8320, loss: 23.8770, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.08it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9455, LAS: 0.8928, UEM: 0.5466, LEM: 0.2615, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3333, partial_loss/deprel_loss: 46.5675, partial_loss/cycle_loss: 0.0000, batch_loss: 37.5207, loss: 25.1771, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.01it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8289, UAS: 0.9443, LAS: 0.8922, UEM: 0.5920, LEM: 0.3072, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.7122, partial_loss/deprel_loss: 54.8760, partial_loss/cycle_loss: 0.0000, batch_loss: 44.2433, loss: 25.7398, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8877, UAS: 0.9467, LAS: 0.8962, UEM: 0.6526, LEM: 0.3920, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7148, partial_loss/deprel_loss: 33.5731, partial_loss/cycle_loss: 0.0000, batch_loss: 27.0014, loss: 24.9927, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.02it/s]\n",
      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 01:07:12,768 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.410  |    33.573\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.332  |     0.715\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.168  |     0.000\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - UEM                      |     0.639  |     0.653\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - LAS                      |     0.920  |     0.896\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - loss                     |     0.586  |    24.993\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - LEM                      |     0.411  |     0.392\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - UAS                      |     0.958  |     0.947\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - EM                       |     0.922  |     0.888\n",
      "2023-04-07 01:07:12,769 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:07:12,774 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:07:17,870 - INFO - combo.training.trainer - Epoch duration: 0:01:32.751562\n",
      "2023-04-07 01:07:17,870 - INFO - combo.training.trainer - Estimated training time remaining: 6:47:04\n",
      "2023-04-07 01:07:17,870 - INFO - allennlp.training.trainer - Epoch 101/399\n",
      "2023-04-07 01:07:17,871 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:07:17,871 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:07:17,886 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9265, UAS: 0.9584, LAS: 0.9224, UEM: 0.5521, LEM: 0.3333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2957, partial_loss/deprel_loss: 0.4164, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5597, loss: 0.5687, batch_reg_loss: 0.1675, reg_loss: 0.1675 ||:   4%|3         | 4/111 [00:02<01:07,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9619, LAS: 0.9268, UEM: 0.5710, LEM: 0.3375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3029, partial_loss/deprel_loss: 0.3438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.5421, batch_reg_loss: 0.1675, reg_loss: 0.1675 ||:   6%|6         | 7/111 [00:04<01:08,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9637, LAS: 0.9273, UEM: 0.6240, LEM: 0.3714, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1911, partial_loss/deprel_loss: 0.3880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5160, loss: 0.5432, batch_reg_loss: 0.1674, reg_loss: 0.1675 ||:  10%|9         | 11/111 [00:07<01:06,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8927, UAS: 0.9639, LAS: 0.9273, UEM: 0.6749, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7485, partial_loss/deprel_loss: 0.5903, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7893, loss: 0.5387, batch_reg_loss: 0.1674, reg_loss: 0.1675 ||:  13%|#2        | 14/111 [00:09<01:08,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9642, LAS: 0.9277, UEM: 0.6725, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1768, partial_loss/deprel_loss: 0.3002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4429, loss: 0.5336, batch_reg_loss: 0.1674, reg_loss: 0.1675 ||:  15%|#5        | 17/111 [00:11<01:05,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9644, LAS: 0.9284, UEM: 0.6859, LEM: 0.4493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2393, partial_loss/deprel_loss: 0.3348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4831, loss: 0.5291, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  18%|#8        | 20/111 [00:13<01:03,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8949, UAS: 0.9625, LAS: 0.9264, UEM: 0.6755, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8730, partial_loss/deprel_loss: 0.5417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7753, loss: 0.5407, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  22%|##1       | 24/111 [00:16<00:58,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9616, LAS: 0.9251, UEM: 0.6596, LEM: 0.4235, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1901, partial_loss/deprel_loss: 0.3190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4606, loss: 0.5484, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  25%|##5       | 28/111 [00:18<00:54,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9613, LAS: 0.9247, UEM: 0.6721, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1284, partial_loss/deprel_loss: 0.2451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3892, loss: 0.5513, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  28%|##7       | 31/111 [00:21<00:55,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9605, LAS: 0.9233, UEM: 0.6628, LEM: 0.4289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3010, partial_loss/deprel_loss: 0.4006, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5480, loss: 0.5633, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  32%|###1      | 35/111 [00:23<00:51,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9603, LAS: 0.9233, UEM: 0.6703, LEM: 0.4406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8033, partial_loss/deprel_loss: 0.5819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7936, loss: 0.5633, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  34%|###4      | 38/111 [00:26<00:51,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9592, LAS: 0.9221, UEM: 0.6568, LEM: 0.4260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3455, partial_loss/deprel_loss: 0.4157, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5690, loss: 0.5733, batch_reg_loss: 0.1674, reg_loss: 0.1674 ||:  38%|###7      | 42/111 [00:28<00:46,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9601, LAS: 0.9232, UEM: 0.6750, LEM: 0.4480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2816, partial_loss/deprel_loss: 0.3762, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5246, loss: 0.5658, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  41%|####      | 45/111 [00:30<00:47,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9595, LAS: 0.9226, UEM: 0.6701, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1848, partial_loss/deprel_loss: 0.2736, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4232, loss: 0.5682, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  43%|####3     | 48/111 [00:33<00:46,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9591, LAS: 0.9219, UEM: 0.6620, LEM: 0.4339, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3598, partial_loss/deprel_loss: 0.3840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5465, loss: 0.5704, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  47%|####6     | 52/111 [00:35<00:42,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9588, LAS: 0.9216, UEM: 0.6517, LEM: 0.4234, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2664, partial_loss/deprel_loss: 0.3243, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4800, loss: 0.5722, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  51%|#####1    | 57/111 [00:38<00:34,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9581, LAS: 0.9209, UEM: 0.6493, LEM: 0.4205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7026, partial_loss/deprel_loss: 0.5731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7663, loss: 0.5773, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  55%|#####4    | 61/111 [00:40<00:30,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9588, LAS: 0.9219, UEM: 0.6482, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1957, partial_loss/deprel_loss: 0.2670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4201, loss: 0.5711, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  59%|#####9    | 66/111 [00:42<00:24,  1.83it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9582, LAS: 0.9211, UEM: 0.6423, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4466, partial_loss/deprel_loss: 0.4426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6107, loss: 0.5769, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  63%|######3   | 70/111 [00:44<00:21,  1.88it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9577, LAS: 0.9206, UEM: 0.6412, LEM: 0.4125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3618, partial_loss/deprel_loss: 0.7365, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0288, loss: 0.5812, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  67%|######6   | 74/111 [00:47<00:21,  1.73it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9579, LAS: 0.9208, UEM: 0.6425, LEM: 0.4136, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1749, partial_loss/deprel_loss: 0.2488, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4013, loss: 0.5804, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  70%|#######   | 78/111 [00:49<00:20,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9581, LAS: 0.9210, UEM: 0.6432, LEM: 0.4122, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2130, partial_loss/deprel_loss: 0.3557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4944, loss: 0.5795, batch_reg_loss: 0.1673, reg_loss: 0.1674 ||:  74%|#######3  | 82/111 [00:52<00:18,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9580, LAS: 0.9209, UEM: 0.6464, LEM: 0.4164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1589, partial_loss/deprel_loss: 0.2839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4262, loss: 0.5795, batch_reg_loss: 0.1672, reg_loss: 0.1674 ||:  77%|#######7  | 86/111 [00:55<00:16,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9579, LAS: 0.9210, UEM: 0.6548, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8256, partial_loss/deprel_loss: 0.5331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7588, loss: 0.5791, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  81%|########1 | 90/111 [00:58<00:15,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9581, LAS: 0.9212, UEM: 0.6497, LEM: 0.4266, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3404, partial_loss/deprel_loss: 0.3952, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5515, loss: 0.5793, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  85%|########4 | 94/111 [01:01<00:11,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9577, LAS: 0.9208, UEM: 0.6408, LEM: 0.4191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4775, partial_loss/deprel_loss: 0.4866, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6519, loss: 0.5825, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  88%|########8 | 98/111 [01:04<00:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9580, LAS: 0.9210, UEM: 0.6418, LEM: 0.4177, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3033, partial_loss/deprel_loss: 0.3534, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5105, loss: 0.5806, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  92%|#########1| 102/111 [01:06<00:05,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9581, LAS: 0.9211, UEM: 0.6415, LEM: 0.4162, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4302, partial_loss/deprel_loss: 0.4356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6017, loss: 0.5786, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  95%|#########5| 106/111 [01:09<00:03,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9221, UAS: 0.9576, LAS: 0.9205, UEM: 0.6366, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3003, partial_loss/deprel_loss: 0.4267, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5686, loss: 0.5836, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||:  99%|#########9| 110/111 [01:12<00:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9574, LAS: 0.9204, UEM: 0.6345, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6024, partial_loss/deprel_loss: 0.4961, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6845, loss: 0.5845, batch_reg_loss: 0.1672, reg_loss: 0.1673 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
      "2023-04-07 01:08:33,893 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.496  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.602  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.167  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - UEM                      |     0.635  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - LAS                      |     0.920  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - loss                     |     0.584  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - LEM                      |     0.410  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:08:33,894 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - UAS                      |     0.957  |       N/A\n",
      "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - EM                       |     0.908  |       N/A\n",
      "2023-04-07 01:08:33,895 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:08:33,900 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:08:38,949 - INFO - combo.training.trainer - Epoch duration: 0:01:21.078534\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:08:38,950 - INFO - combo.training.trainer - Estimated training time remaining: 6:45:41\n",
      "2023-04-07 01:08:38,950 - INFO - allennlp.training.trainer - Epoch 102/399\n",
      "2023-04-07 01:08:38,950 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:08:38,951 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:08:38,961 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9606, LAS: 0.9211, UEM: 0.6524, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4132, partial_loss/deprel_loss: 0.3944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5653, loss: 0.5691, batch_reg_loss: 0.1672, reg_loss: 0.1672 ||:   4%|3         | 4/111 [00:02<01:05,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9652, LAS: 0.9307, UEM: 0.7796, LEM: 0.6236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2336, partial_loss/deprel_loss: 0.2765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4351, loss: 0.5078, batch_reg_loss: 0.1672, reg_loss: 0.1672 ||:   6%|6         | 7/111 [00:04<01:08,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9618, LAS: 0.9261, UEM: 0.7107, LEM: 0.5336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3021, partial_loss/deprel_loss: 0.3575, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5136, loss: 0.5332, batch_reg_loss: 0.1671, reg_loss: 0.1672 ||:  10%|9         | 11/111 [00:07<01:04,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9556, UAS: 0.9634, LAS: 0.9282, UEM: 0.7425, LEM: 0.5678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0768, partial_loss/deprel_loss: 0.1740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3217, loss: 0.5227, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  13%|#2        | 14/111 [00:09<01:07,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9632, LAS: 0.9276, UEM: 0.7412, LEM: 0.5525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7525, partial_loss/deprel_loss: 0.5876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7877, loss: 0.5288, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  15%|#5        | 17/111 [00:11<01:06,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8545, UAS: 0.9589, LAS: 0.9228, UEM: 0.7120, LEM: 0.5238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.5075, partial_loss/deprel_loss: 0.7973, partial_loss/cycle_loss: 0.0000, batch_loss: 1.1065, loss: 0.5675, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  18%|#8        | 20/111 [00:13<01:03,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9608, LAS: 0.9247, UEM: 0.7363, LEM: 0.5412, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2577, partial_loss/deprel_loss: 0.3379, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4890, loss: 0.5495, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  21%|##        | 23/111 [00:15<01:01,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.9585, LAS: 0.9220, UEM: 0.7148, LEM: 0.5201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8773, partial_loss/deprel_loss: 0.6363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8516, loss: 0.5670, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  24%|##4       | 27/111 [00:18<00:56,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9581, LAS: 0.9220, UEM: 0.7103, LEM: 0.5096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2279, partial_loss/deprel_loss: 0.3713, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5097, loss: 0.5672, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  28%|##7       | 31/111 [00:21<00:53,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9580, LAS: 0.9217, UEM: 0.7005, LEM: 0.4974, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2093, partial_loss/deprel_loss: 0.3733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5076, loss: 0.5702, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  31%|###       | 34/111 [00:23<00:53,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9580, LAS: 0.9217, UEM: 0.6965, LEM: 0.4926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1576, partial_loss/deprel_loss: 0.2765, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4198, loss: 0.5702, batch_reg_loss: 0.1671, reg_loss: 0.1671 ||:  33%|###3      | 37/111 [00:25<00:50,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9577, LAS: 0.9215, UEM: 0.6872, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1256, partial_loss/deprel_loss: 0.2269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3737, loss: 0.5715, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  38%|###7      | 42/111 [00:27<00:42,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8963, UAS: 0.9560, LAS: 0.9194, UEM: 0.6657, LEM: 0.4646, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6179, partial_loss/deprel_loss: 0.6150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7826, loss: 0.5871, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  42%|####2     | 47/111 [00:30<00:37,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9152, UAS: 0.9558, LAS: 0.9192, UEM: 0.6558, LEM: 0.4525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5090, partial_loss/deprel_loss: 0.4367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6182, loss: 0.5894, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  47%|####6     | 52/111 [00:32<00:32,  1.81it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9564, LAS: 0.9201, UEM: 0.6553, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1447, partial_loss/deprel_loss: 0.2119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3655, loss: 0.5824, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  50%|#####     | 56/111 [00:35<00:32,  1.71it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9332, UAS: 0.9571, LAS: 0.9206, UEM: 0.6498, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2884, partial_loss/deprel_loss: 0.3945, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5403, loss: 0.5802, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  54%|#####4    | 60/111 [00:38<00:32,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9577, LAS: 0.9213, UEM: 0.6562, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0998, partial_loss/deprel_loss: 0.2114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3561, loss: 0.5750, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  58%|#####7    | 64/111 [00:41<00:31,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9585, LAS: 0.9220, UEM: 0.6612, LEM: 0.4481, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1420, partial_loss/deprel_loss: 0.3105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4438, loss: 0.5705, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  61%|######1   | 68/111 [00:44<00:30,  1.43it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9588, LAS: 0.9223, UEM: 0.6601, LEM: 0.4452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4256, partial_loss/deprel_loss: 0.4427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6063, loss: 0.5690, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  64%|######3   | 71/111 [00:46<00:28,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9588, LAS: 0.9222, UEM: 0.6597, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7597, partial_loss/deprel_loss: 0.5197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7346, loss: 0.5689, batch_reg_loss: 0.1670, reg_loss: 0.1671 ||:  67%|######6   | 74/111 [00:48<00:26,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9592, LAS: 0.9224, UEM: 0.6585, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2314, partial_loss/deprel_loss: 0.3426, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4873, loss: 0.5679, batch_reg_loss: 0.1669, reg_loss: 0.1671 ||:  70%|#######   | 78/111 [00:50<00:22,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8957, UAS: 0.9587, LAS: 0.9218, UEM: 0.6511, LEM: 0.4325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7663, partial_loss/deprel_loss: 0.5629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7705, loss: 0.5723, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  74%|#######3  | 82/111 [00:53<00:19,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9592, LAS: 0.9222, UEM: 0.6537, LEM: 0.4325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1484, partial_loss/deprel_loss: 0.2987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4355, loss: 0.5698, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  77%|#######7  | 86/111 [00:56<00:16,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9595, LAS: 0.9227, UEM: 0.6553, LEM: 0.4340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1589, partial_loss/deprel_loss: 0.2685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4135, loss: 0.5666, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  80%|########  | 89/111 [00:58<00:15,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9593, LAS: 0.9226, UEM: 0.6498, LEM: 0.4279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5596, partial_loss/deprel_loss: 0.5026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6809, loss: 0.5676, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  84%|########3 | 93/111 [01:01<00:12,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9590, LAS: 0.9221, UEM: 0.6420, LEM: 0.4201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4337, partial_loss/deprel_loss: 0.4895, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6452, loss: 0.5714, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  87%|########7 | 97/111 [01:04<00:09,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9589, LAS: 0.9219, UEM: 0.6386, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3582, partial_loss/deprel_loss: 0.4022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5602, loss: 0.5725, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  90%|######### | 100/111 [01:06<00:07,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9590, LAS: 0.9220, UEM: 0.6363, LEM: 0.4131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5635, partial_loss/deprel_loss: 0.4484, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6383, loss: 0.5716, batch_reg_loss: 0.1669, reg_loss: 0.1670 ||:  93%|#########2| 103/111 [01:08<00:05,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9591, LAS: 0.9222, UEM: 0.6381, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2237, partial_loss/deprel_loss: 0.3158, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4642, loss: 0.5704, batch_reg_loss: 0.1668, reg_loss: 0.1670 ||:  95%|#########5| 106/111 [01:10<00:03,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9586, LAS: 0.9217, UEM: 0.6342, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4813, partial_loss/deprel_loss: 0.4999, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6630, loss: 0.5739, batch_reg_loss: 0.1668, reg_loss: 0.1670 ||:  99%|#########9| 110/111 [01:13<00:00,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9585, LAS: 0.9215, UEM: 0.6323, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6699, partial_loss/deprel_loss: 0.5022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7025, loss: 0.5751, batch_reg_loss: 0.1668, reg_loss: 0.1670 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:09:55,423 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.502  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.670  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.167  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - UEM                      |     0.632  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - loss                     |     0.575  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - LEM                      |     0.410  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - UAS                      |     0.958  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:09:55,424 - INFO - combo.training.tensorboard_writer - EM                       |     0.903  |       N/A\n",
      "2023-04-07 01:09:55,425 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:09:55,430 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:09:59,571 - INFO - combo.training.trainer - Epoch duration: 0:01:20.620700\n",
      "2023-04-07 01:09:59,571 - INFO - combo.training.trainer - Estimated training time remaining: 6:44:16\n",
      "2023-04-07 01:09:59,571 - INFO - allennlp.training.trainer - Epoch 103/399\n",
      "2023-04-07 01:09:59,571 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:09:59,572 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:09:59,580 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9667, LAS: 0.9267, UEM: 0.6543, LEM: 0.3516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2148, partial_loss/deprel_loss: 0.3473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4876, loss: 0.5462, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:   4%|3         | 4/111 [00:02<01:16,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9632, LAS: 0.9251, UEM: 0.6317, LEM: 0.3365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1864, partial_loss/deprel_loss: 0.3413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4771, loss: 0.5638, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:   6%|6         | 7/111 [00:04<01:13,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9657, LAS: 0.9289, UEM: 0.7378, LEM: 0.5188, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0321, partial_loss/deprel_loss: 0.1224, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2712, loss: 0.5427, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:   9%|9         | 10/111 [00:07<01:15,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9589, LAS: 0.9227, UEM: 0.6830, LEM: 0.4771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6950, partial_loss/deprel_loss: 0.5189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7209, loss: 0.5806, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:  13%|#2        | 14/111 [00:10<01:09,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9279, UAS: 0.9609, LAS: 0.9240, UEM: 0.6861, LEM: 0.4643, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2205, partial_loss/deprel_loss: 0.3790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.5681, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:  15%|#5        | 17/111 [00:12<01:07,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9060, UAS: 0.9623, LAS: 0.9250, UEM: 0.7001, LEM: 0.4740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6032, partial_loss/deprel_loss: 0.4965, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6846, loss: 0.5604, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:  18%|#8        | 20/111 [00:14<01:05,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9602, LAS: 0.9230, UEM: 0.6678, LEM: 0.4394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7369, partial_loss/deprel_loss: 0.4643, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6856, loss: 0.5714, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:  22%|##1       | 24/111 [00:16<00:59,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9611, LAS: 0.9240, UEM: 0.6702, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2633, partial_loss/deprel_loss: 0.3939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5345, loss: 0.5612, batch_reg_loss: 0.1668, reg_loss: 0.1668 ||:  26%|##6       | 29/111 [00:19<00:51,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9599, LAS: 0.9224, UEM: 0.6433, LEM: 0.4131, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3315, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5697, loss: 0.5704, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  31%|###       | 34/111 [00:21<00:44,  1.74it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9598, LAS: 0.9225, UEM: 0.6343, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2272, partial_loss/deprel_loss: 0.2924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4461, loss: 0.5673, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  35%|###5      | 39/111 [00:23<00:39,  1.83it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8991, UAS: 0.9603, LAS: 0.9230, UEM: 0.6486, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5966, partial_loss/deprel_loss: 0.5535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7288, loss: 0.5641, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  39%|###8      | 43/111 [00:26<00:38,  1.78it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9583, LAS: 0.9213, UEM: 0.6354, LEM: 0.4107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3198, partial_loss/deprel_loss: 0.3918, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5442, loss: 0.5782, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  42%|####2     | 47/111 [00:29<00:39,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8768, UAS: 0.9562, LAS: 0.9189, UEM: 0.6229, LEM: 0.4013, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9840, partial_loss/deprel_loss: 0.6410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8763, loss: 0.5938, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  46%|####5     | 51/111 [00:31<00:37,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9570, LAS: 0.9198, UEM: 0.6357, LEM: 0.4096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2263, partial_loss/deprel_loss: 0.3587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4989, loss: 0.5857, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  50%|####9     | 55/111 [00:35<00:37,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9578, LAS: 0.9206, UEM: 0.6415, LEM: 0.4125, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1857, partial_loss/deprel_loss: 0.3076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4499, loss: 0.5814, batch_reg_loss: 0.1667, reg_loss: 0.1668 ||:  53%|#####3    | 59/111 [00:37<00:34,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9581, LAS: 0.9210, UEM: 0.6393, LEM: 0.4106, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3038, partial_loss/deprel_loss: 0.3076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4735, loss: 0.5791, batch_reg_loss: 0.1667, reg_loss: 0.1667 ||:  57%|#####6    | 63/111 [00:40<00:33,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9585, LAS: 0.9215, UEM: 0.6440, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4838, partial_loss/deprel_loss: 0.4486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6223, loss: 0.5752, batch_reg_loss: 0.1667, reg_loss: 0.1667 ||:  59%|#####9    | 66/111 [00:43<00:33,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8947, UAS: 0.9576, LAS: 0.9204, UEM: 0.6336, LEM: 0.4063, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7353, partial_loss/deprel_loss: 0.6104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8020, loss: 0.5839, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  62%|######2   | 69/111 [00:45<00:31,  1.34it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9574, LAS: 0.9203, UEM: 0.6283, LEM: 0.4010, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.3712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5206, loss: 0.5847, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  65%|######4   | 72/111 [00:47<00:29,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9574, LAS: 0.9204, UEM: 0.6231, LEM: 0.3956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3128, partial_loss/deprel_loss: 0.3818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5346, loss: 0.5847, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  68%|######7   | 75/111 [00:50<00:27,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9578, LAS: 0.9211, UEM: 0.6336, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4455, partial_loss/deprel_loss: 0.5083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6624, loss: 0.5806, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  70%|#######   | 78/111 [00:52<00:25,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9024, UAS: 0.9577, LAS: 0.9210, UEM: 0.6295, LEM: 0.4050, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6275, partial_loss/deprel_loss: 0.5117, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7015, loss: 0.5811, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  74%|#######3  | 82/111 [00:55<00:22,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9580, LAS: 0.9213, UEM: 0.6309, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3798, partial_loss/deprel_loss: 0.3906, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5551, loss: 0.5784, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  77%|#######7  | 86/111 [00:58<00:18,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9579, LAS: 0.9213, UEM: 0.6258, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5987, partial_loss/deprel_loss: 0.5247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7061, loss: 0.5788, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  81%|########1 | 90/111 [01:00<00:14,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9580, LAS: 0.9214, UEM: 0.6220, LEM: 0.3940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3268, partial_loss/deprel_loss: 0.3844, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.5793, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  85%|########4 | 94/111 [01:02<00:11,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9583, LAS: 0.9216, UEM: 0.6287, LEM: 0.3993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1964, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4416, loss: 0.5763, batch_reg_loss: 0.1666, reg_loss: 0.1667 ||:  88%|########8 | 98/111 [01:05<00:08,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9518, UAS: 0.9591, LAS: 0.9225, UEM: 0.6436, LEM: 0.4152, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1200, partial_loss/deprel_loss: 0.2479, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3888, loss: 0.5697, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||:  92%|#########1| 102/111 [01:08<00:06,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8799, UAS: 0.9582, LAS: 0.9216, UEM: 0.6361, LEM: 0.4093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8615, partial_loss/deprel_loss: 0.5799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8028, loss: 0.5751, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||:  95%|#########5| 106/111 [01:11<00:03,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9584, LAS: 0.9217, UEM: 0.6389, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5202, partial_loss/deprel_loss: 0.4868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6600, loss: 0.5732, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||:  99%|#########9| 110/111 [01:14<00:00,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9585, LAS: 0.9218, UEM: 0.6393, LEM: 0.4117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2825, partial_loss/deprel_loss: 0.3588, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5101, loss: 0.5726, batch_reg_loss: 0.1665, reg_loss: 0.1667 ||: 100%|##########| 111/111 [01:14<00:00,  1.48it/s]\n",
      "2023-04-07 01:11:17,321 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.359  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.282  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.167  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - UEM                      |     0.639  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |       N/A\n",
      "2023-04-07 01:11:17,322 - INFO - combo.training.tensorboard_writer - loss                     |     0.573  |       N/A\n",
      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - LEM                      |     0.412  |       N/A\n",
      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - EM                       |     0.930  |       N/A\n",
      "2023-04-07 01:11:17,323 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:11:17,334 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:11:22,132 - INFO - combo.training.trainer - Epoch duration: 0:01:22.560293\n",
      "2023-04-07 01:11:22,132 - INFO - combo.training.trainer - Estimated training time remaining: 6:42:57\n",
      "2023-04-07 01:11:22,132 - INFO - allennlp.training.trainer - Epoch 104/399\n",
      "2023-04-07 01:11:22,132 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:11:22,133 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:11:22,143 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9579, LAS: 0.9237, UEM: 0.4843, LEM: 0.2304, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4918, partial_loss/deprel_loss: 0.4045, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5885, loss: 0.5448, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||:   3%|2         | 3/111 [00:02<01:12,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9596, LAS: 0.9227, UEM: 0.5784, LEM: 0.3192, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2692, partial_loss/deprel_loss: 0.3732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5189, loss: 0.5343, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||:   5%|5         | 6/111 [00:04<01:12,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9639, LAS: 0.9279, UEM: 0.6773, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4708, partial_loss/deprel_loss: 0.4108, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5893, loss: 0.5089, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||:   8%|8         | 9/111 [00:06<01:10,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8996, UAS: 0.9582, LAS: 0.9228, UEM: 0.6431, LEM: 0.4054, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8202, partial_loss/deprel_loss: 0.5701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7866, loss: 0.5546, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||:  13%|#2        | 14/111 [00:08<01:01,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9393, UAS: 0.9574, LAS: 0.9219, UEM: 0.6226, LEM: 0.3829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2362, partial_loss/deprel_loss: 0.2969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4512, loss: 0.5644, batch_reg_loss: 0.1665, reg_loss: 0.1665 ||:  17%|#7        | 19/111 [00:11<00:54,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9592, LAS: 0.9236, UEM: 0.6460, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2917, partial_loss/deprel_loss: 0.3613, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5138, loss: 0.5537, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||:  22%|##1       | 24/111 [00:13<00:48,  1.81it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9607, LAS: 0.9253, UEM: 0.6852, LEM: 0.4642, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1332, partial_loss/deprel_loss: 0.2207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3697, loss: 0.5380, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||:  25%|##5       | 28/111 [00:16<00:50,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9083, UAS: 0.9590, LAS: 0.9238, UEM: 0.6721, LEM: 0.4576, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6297, partial_loss/deprel_loss: 0.4486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6512, loss: 0.5475, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||:  29%|##8       | 32/111 [00:19<00:50,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9037, UAS: 0.9587, LAS: 0.9229, UEM: 0.6562, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5505, partial_loss/deprel_loss: 0.5524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7184, loss: 0.5561, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||:  32%|###2      | 36/111 [00:21<00:47,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9583, LAS: 0.9225, UEM: 0.6445, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2530, partial_loss/deprel_loss: 0.3163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4700, loss: 0.5594, batch_reg_loss: 0.1664, reg_loss: 0.1665 ||:  36%|###6      | 40/111 [00:24<00:45,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9180, UAS: 0.9579, LAS: 0.9221, UEM: 0.6292, LEM: 0.4080, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5182, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6220, loss: 0.5646, batch_reg_loss: 0.1664, reg_loss: 0.1664 ||:  40%|###9      | 44/111 [00:27<00:44,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9591, LAS: 0.9233, UEM: 0.6478, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4055, partial_loss/deprel_loss: 0.4315, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5926, loss: 0.5555, batch_reg_loss: 0.1664, reg_loss: 0.1664 ||:  43%|####3     | 48/111 [00:30<00:43,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9046, UAS: 0.9582, LAS: 0.9226, UEM: 0.6473, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6240, partial_loss/deprel_loss: 0.5214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7083, loss: 0.5615, batch_reg_loss: 0.1664, reg_loss: 0.1664 ||:  46%|####5     | 51/111 [00:32<00:44,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9587, LAS: 0.9230, UEM: 0.6452, LEM: 0.4223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2726, partial_loss/deprel_loss: 0.3050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4649, loss: 0.5592, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  49%|####8     | 54/111 [00:35<00:43,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9583, LAS: 0.9225, UEM: 0.6372, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5030, partial_loss/deprel_loss: 0.5071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6726, loss: 0.5631, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  51%|#####1    | 57/111 [00:37<00:40,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8865, UAS: 0.9576, LAS: 0.9218, UEM: 0.6313, LEM: 0.4109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8949, partial_loss/deprel_loss: 0.5334, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7720, loss: 0.5673, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  54%|#####4    | 60/111 [00:39<00:37,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9583, LAS: 0.9223, UEM: 0.6402, LEM: 0.4173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1827, partial_loss/deprel_loss: 0.2880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4332, loss: 0.5619, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  57%|#####6    | 63/111 [00:41<00:36,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9584, LAS: 0.9225, UEM: 0.6340, LEM: 0.4100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2745, partial_loss/deprel_loss: 0.3362, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4901, loss: 0.5619, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  59%|#####9    | 66/111 [00:44<00:33,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9590, LAS: 0.9233, UEM: 0.6448, LEM: 0.4206, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0997, partial_loss/deprel_loss: 0.2236, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3651, loss: 0.5570, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  63%|######3   | 70/111 [00:46<00:28,  1.41it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9587, LAS: 0.9229, UEM: 0.6394, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.4674, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6163, loss: 0.5598, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  67%|######6   | 74/111 [00:49<00:25,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9005, UAS: 0.9587, LAS: 0.9230, UEM: 0.6390, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8076, partial_loss/deprel_loss: 0.4870, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7174, loss: 0.5591, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  70%|#######   | 78/111 [00:51<00:20,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9590, LAS: 0.9232, UEM: 0.6394, LEM: 0.4138, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1533, partial_loss/deprel_loss: 0.2899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4288, loss: 0.5578, batch_reg_loss: 0.1663, reg_loss: 0.1664 ||:  74%|#######3  | 82/111 [00:53<00:18,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9591, LAS: 0.9233, UEM: 0.6367, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4186, partial_loss/deprel_loss: 0.4657, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6226, loss: 0.5577, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  77%|#######7  | 86/111 [00:56<00:15,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9588, LAS: 0.9227, UEM: 0.6289, LEM: 0.4028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6325, partial_loss/deprel_loss: 0.5095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7003, loss: 0.5627, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  81%|########1 | 90/111 [00:58<00:13,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9590, LAS: 0.9230, UEM: 0.6330, LEM: 0.4060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1584, partial_loss/deprel_loss: 0.2693, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4134, loss: 0.5602, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  85%|########4 | 94/111 [01:01<00:11,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9589, LAS: 0.9227, UEM: 0.6276, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2896, partial_loss/deprel_loss: 0.3616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5134, loss: 0.5627, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  88%|########8 | 98/111 [01:03<00:08,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9581, LAS: 0.9220, UEM: 0.6366, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0334, partial_loss/deprel_loss: 0.1020, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2545, loss: 0.5686, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  92%|#########1| 102/111 [01:06<00:06,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9582, LAS: 0.9220, UEM: 0.6356, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3712, partial_loss/deprel_loss: 0.3612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5294, loss: 0.5684, batch_reg_loss: 0.1662, reg_loss: 0.1664 ||:  95%|#########5| 106/111 [01:09<00:03,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9585, LAS: 0.9225, UEM: 0.6374, LEM: 0.4164, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3568, partial_loss/deprel_loss: 0.3704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5339, loss: 0.5656, batch_reg_loss: 0.1662, reg_loss: 0.1663 ||:  99%|#########9| 110/111 [01:12<00:00,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9585, LAS: 0.9225, UEM: 0.6356, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4134, partial_loss/deprel_loss: 0.4592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6162, loss: 0.5660, batch_reg_loss: 0.1662, reg_loss: 0.1663 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:12:38,230 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.459  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.413  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.166  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - UEM                      |     0.636  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - loss                     |     0.566  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - LEM                      |     0.415  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - UAS                      |     0.958  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - EM                       |     0.921  |       N/A\n",
      "2023-04-07 01:12:38,231 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:12:38,238 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:12:43,544 - INFO - combo.training.trainer - Epoch duration: 0:01:21.411689\n",
      "2023-04-07 01:12:43,545 - INFO - combo.training.trainer - Estimated training time remaining: 6:41:35\n",
      "2023-04-07 01:12:43,545 - INFO - allennlp.training.trainer - Epoch 105/399\n",
      "2023-04-07 01:12:43,545 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:12:43,546 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:12:43,555 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9605, LAS: 0.9238, UEM: 0.5154, LEM: 0.2423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.4087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5874, loss: 0.5467, batch_reg_loss: 0.1662, reg_loss: 0.1662 ||:   4%|3         | 4/111 [00:02<00:54,  1.95it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9555, LAS: 0.9193, UEM: 0.4861, LEM: 0.2369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3070, partial_loss/deprel_loss: 0.3412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5006, loss: 0.5761, batch_reg_loss: 0.1662, reg_loss: 0.1662 ||:   7%|7         | 8/111 [00:04<00:55,  1.87it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9145, UAS: 0.9566, LAS: 0.9206, UEM: 0.5133, LEM: 0.2719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4960, partial_loss/deprel_loss: 0.4824, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6513, loss: 0.5721, batch_reg_loss: 0.1661, reg_loss: 0.1662 ||:  11%|#         | 12/111 [00:06<00:54,  1.81it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9589, LAS: 0.9236, UEM: 0.5616, LEM: 0.3189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2420, partial_loss/deprel_loss: 0.3775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5165, loss: 0.5580, batch_reg_loss: 0.1661, reg_loss: 0.1662 ||:  14%|#4        | 16/111 [00:09<00:55,  1.71it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9586, LAS: 0.9240, UEM: 0.5809, LEM: 0.3489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7090, partial_loss/deprel_loss: 0.4814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6930, loss: 0.5559, batch_reg_loss: 0.1661, reg_loss: 0.1662 ||:  18%|#8        | 20/111 [00:11<00:52,  1.74it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9578, LAS: 0.9217, UEM: 0.5885, LEM: 0.3592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1913, partial_loss/deprel_loss: 0.2940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4395, loss: 0.5726, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||:  22%|##1       | 24/111 [00:13<00:49,  1.76it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9590, LAS: 0.9226, UEM: 0.5978, LEM: 0.3627, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4385, partial_loss/deprel_loss: 0.5090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6610, loss: 0.5674, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||:  26%|##6       | 29/111 [00:16<00:43,  1.89it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9008, UAS: 0.9586, LAS: 0.9223, UEM: 0.5805, LEM: 0.3475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6027, partial_loss/deprel_loss: 0.5682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7412, loss: 0.5714, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||:  30%|##9       | 33/111 [00:18<00:42,  1.84it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9587, LAS: 0.9221, UEM: 0.6065, LEM: 0.3742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2653, partial_loss/deprel_loss: 0.4016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5404, loss: 0.5698, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||:  33%|###3      | 37/111 [00:21<00:43,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9594, LAS: 0.9225, UEM: 0.6225, LEM: 0.3869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2054, partial_loss/deprel_loss: 0.3136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4580, loss: 0.5648, batch_reg_loss: 0.1661, reg_loss: 0.1661 ||:  37%|###6      | 41/111 [00:24<00:44,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9591, LAS: 0.9220, UEM: 0.6231, LEM: 0.3862, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2100, partial_loss/deprel_loss: 0.3562, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4930, loss: 0.5681, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  41%|####      | 45/111 [00:26<00:41,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9592, LAS: 0.9222, UEM: 0.6172, LEM: 0.3777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4882, loss: 0.5694, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  44%|####4     | 49/111 [00:29<00:39,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9592, LAS: 0.9220, UEM: 0.6134, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4211, partial_loss/deprel_loss: 0.5321, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.5711, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  48%|####7     | 53/111 [00:32<00:39,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9597, LAS: 0.9228, UEM: 0.6325, LEM: 0.4001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2204, partial_loss/deprel_loss: 0.2532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4126, loss: 0.5662, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  50%|#####     | 56/111 [00:34<00:39,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9752, UAS: 0.9606, LAS: 0.9240, UEM: 0.6598, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0256, partial_loss/deprel_loss: 0.0931, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2456, loss: 0.5583, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  53%|#####3    | 59/111 [00:37<00:40,  1.28it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9606, LAS: 0.9239, UEM: 0.6677, LEM: 0.4476, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1025, partial_loss/deprel_loss: 0.2338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3735, loss: 0.5582, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  57%|#####6    | 63/111 [00:40<00:37,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9603, LAS: 0.9236, UEM: 0.6652, LEM: 0.4453, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5848, partial_loss/deprel_loss: 0.4815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6681, loss: 0.5607, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  59%|#####9    | 66/111 [00:42<00:33,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9604, LAS: 0.9236, UEM: 0.6648, LEM: 0.4440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1711, partial_loss/deprel_loss: 0.2880, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4306, loss: 0.5598, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  62%|######2   | 69/111 [00:44<00:31,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9592, LAS: 0.9223, UEM: 0.6538, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0157, partial_loss/deprel_loss: 0.6286, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8720, loss: 0.5674, batch_reg_loss: 0.1660, reg_loss: 0.1661 ||:  66%|######5   | 73/111 [00:47<00:26,  1.43it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9588, LAS: 0.9219, UEM: 0.6449, LEM: 0.4262, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3976, partial_loss/deprel_loss: 0.4270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5871, loss: 0.5712, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||:  69%|######9   | 77/111 [00:49<00:23,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8965, UAS: 0.9580, LAS: 0.9211, UEM: 0.6370, LEM: 0.4197, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9152, partial_loss/deprel_loss: 0.6189, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8441, loss: 0.5799, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||:  72%|#######2  | 80/111 [00:51<00:21,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9087, UAS: 0.9576, LAS: 0.9209, UEM: 0.6312, LEM: 0.4145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6424, partial_loss/deprel_loss: 0.4890, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6856, loss: 0.5808, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||:  75%|#######4  | 83/111 [00:54<00:19,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9583, LAS: 0.9215, UEM: 0.6427, LEM: 0.4242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1461, partial_loss/deprel_loss: 0.2934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4299, loss: 0.5761, batch_reg_loss: 0.1659, reg_loss: 0.1661 ||:  77%|#######7  | 86/111 [00:56<00:17,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9589, LAS: 0.9221, UEM: 0.6461, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1714, partial_loss/deprel_loss: 0.3043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.5725, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  81%|########1 | 90/111 [00:58<00:14,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9593, LAS: 0.9225, UEM: 0.6463, LEM: 0.4227, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1769, partial_loss/deprel_loss: 0.2699, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4172, loss: 0.5698, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  85%|########4 | 94/111 [01:01<00:11,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9595, LAS: 0.9228, UEM: 0.6455, LEM: 0.4205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2810, partial_loss/deprel_loss: 0.3794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5256, loss: 0.5681, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  88%|########8 | 98/111 [01:03<00:08,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9592, LAS: 0.9224, UEM: 0.6407, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5674, partial_loss/deprel_loss: 0.3946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5951, loss: 0.5697, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  92%|#########1| 102/111 [01:06<00:05,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9595, LAS: 0.9227, UEM: 0.6432, LEM: 0.4163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4095, loss: 0.5678, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  95%|#########5| 106/111 [01:09<00:03,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8596, UAS: 0.9588, LAS: 0.9218, UEM: 0.6365, LEM: 0.4107, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3701, partial_loss/deprel_loss: 0.8036, partial_loss/cycle_loss: 0.0000, batch_loss: 1.0827, loss: 0.5747, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||:  99%|#########9| 110/111 [01:12<00:00,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9586, LAS: 0.9217, UEM: 0.6349, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6125, partial_loss/deprel_loss: 0.5305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7127, loss: 0.5760, batch_reg_loss: 0.1659, reg_loss: 0.1660 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
      "2023-04-07 01:13:59,528 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9553, LAS: 0.9111, UEM: 0.7989, LEM: 0.6196, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1845, partial_loss/deprel_loss: 18.4393, partial_loss/cycle_loss: 0.0000, batch_loss: 14.7883, loss: 19.5219, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.05s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9480, LAS: 0.9002, UEM: 0.6879, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4402, partial_loss/deprel_loss: 23.9572, partial_loss/cycle_loss: 0.0000, batch_loss: 19.2538, loss: 24.4794, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:07,  1.01it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8872, UAS: 0.9532, LAS: 0.9045, UEM: 0.6803, LEM: 0.4123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7114, partial_loss/deprel_loss: 29.0657, partial_loss/cycle_loss: 0.0000, batch_loss: 23.3948, loss: 22.1284, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:07<00:03,  1.14it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8793, UAS: 0.9449, LAS: 0.8945, UEM: 0.6256, LEM: 0.3659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0921, partial_loss/deprel_loss: 41.6153, partial_loss/cycle_loss: 0.0000, batch_loss: 33.5107, loss: 25.4303, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:09<00:00,  1.16it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9476, LAS: 0.8979, UEM: 0.6576, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1506, partial_loss/deprel_loss: 22.9104, partial_loss/cycle_loss: 0.0000, batch_loss: 18.3585, loss: 24.8863, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:10<00:00,  1.29it/s]\n",
      "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:14:09,620 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.530  |    22.910\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.613  |     0.151\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.166  |     0.000\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - UEM                      |     0.635  |     0.658\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - LAS                      |     0.922  |     0.898\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - loss                     |     0.576  |    24.886\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - LEM                      |     0.409  |     0.394\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |     0.948\n",
      "2023-04-07 01:14:09,621 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:14:09,622 - INFO - combo.training.tensorboard_writer - EM                       |     0.905  |     0.939\n",
      "2023-04-07 01:14:09,622 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:14:09,626 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:14:14,904 - INFO - combo.training.trainer - Epoch duration: 0:01:31.359274\n",
      "2023-04-07 01:14:14,905 - INFO - combo.training.trainer - Estimated training time remaining: 6:40:40\n",
      "2023-04-07 01:14:14,905 - INFO - allennlp.training.trainer - Epoch 106/399\n",
      "2023-04-07 01:14:14,905 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:14:14,906 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:14:14,916 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9597, LAS: 0.9221, UEM: 0.6360, LEM: 0.4109, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1200, partial_loss/deprel_loss: 0.2448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3857, loss: 0.5495, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:   4%|3         | 4/111 [00:02<01:11,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8979, UAS: 0.9562, LAS: 0.9204, UEM: 0.6661, LEM: 0.4711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6598, partial_loss/deprel_loss: 0.4809, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6825, loss: 0.5676, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:   6%|6         | 7/111 [00:04<01:11,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9575, LAS: 0.9226, UEM: 0.6810, LEM: 0.4839, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7804, partial_loss/deprel_loss: 0.6168, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8153, loss: 0.5618, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:   9%|9         | 10/111 [00:07<01:10,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9585, LAS: 0.9235, UEM: 0.6787, LEM: 0.4796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1399, partial_loss/deprel_loss: 0.2521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3955, loss: 0.5556, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  12%|#1        | 13/111 [00:09<01:11,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9589, LAS: 0.9241, UEM: 0.6982, LEM: 0.5117, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5977, partial_loss/deprel_loss: 0.5713, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7424, loss: 0.5556, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  14%|#4        | 16/111 [00:11<01:08,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9035, UAS: 0.9575, LAS: 0.9222, UEM: 0.6738, LEM: 0.4852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6464, partial_loss/deprel_loss: 0.4745, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6747, loss: 0.5711, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  17%|#7        | 19/111 [00:13<01:08,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9568, LAS: 0.9216, UEM: 0.6542, LEM: 0.4620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2399, partial_loss/deprel_loss: 0.2948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4496, loss: 0.5771, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  21%|##        | 23/111 [00:16<01:02,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9569, LAS: 0.9217, UEM: 0.6400, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2381, partial_loss/deprel_loss: 0.3725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5114, loss: 0.5755, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  24%|##4       | 27/111 [00:19<00:58,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9582, LAS: 0.9229, UEM: 0.6431, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3158, partial_loss/deprel_loss: 0.3573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.5670, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  28%|##7       | 31/111 [00:21<00:52,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9237, UAS: 0.9594, LAS: 0.9240, UEM: 0.6449, LEM: 0.4297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3148, partial_loss/deprel_loss: 0.3962, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5457, loss: 0.5601, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  32%|###1      | 35/111 [00:24<00:51,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9591, LAS: 0.9232, UEM: 0.6442, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8498, partial_loss/deprel_loss: 0.6169, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8292, loss: 0.5630, batch_reg_loss: 0.1658, reg_loss: 0.1658 ||:  34%|###4      | 38/111 [00:26<00:49,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9023, UAS: 0.9595, LAS: 0.9239, UEM: 0.6561, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7706, partial_loss/deprel_loss: 0.5407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7524, loss: 0.5581, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  37%|###6      | 41/111 [00:28<00:48,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9595, LAS: 0.9238, UEM: 0.6468, LEM: 0.4285, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5706, partial_loss/deprel_loss: 0.4615, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6490, loss: 0.5583, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  41%|####      | 45/111 [00:31<00:45,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9026, UAS: 0.9591, LAS: 0.9235, UEM: 0.6394, LEM: 0.4217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6297, partial_loss/deprel_loss: 0.5389, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7228, loss: 0.5618, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  43%|####3     | 48/111 [00:33<00:43,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9593, LAS: 0.9236, UEM: 0.6394, LEM: 0.4189, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4952, partial_loss/deprel_loss: 0.4717, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6421, loss: 0.5602, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  46%|####5     | 51/111 [00:35<00:42,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9601, LAS: 0.9243, UEM: 0.6537, LEM: 0.4329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1582, partial_loss/deprel_loss: 0.2718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4148, loss: 0.5541, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  49%|####8     | 54/111 [00:38<00:43,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9597, LAS: 0.9237, UEM: 0.6536, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3267, partial_loss/deprel_loss: 0.4067, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5564, loss: 0.5575, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  51%|#####1    | 57/111 [00:40<00:40,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9114, UAS: 0.9588, LAS: 0.9227, UEM: 0.6441, LEM: 0.4226, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5373, partial_loss/deprel_loss: 0.5270, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6947, loss: 0.5655, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  54%|#####4    | 60/111 [00:42<00:38,  1.33it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9288, UAS: 0.9592, LAS: 0.9230, UEM: 0.6392, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3362, partial_loss/deprel_loss: 0.4284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5756, loss: 0.5650, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  58%|#####7    | 64/111 [00:44<00:32,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9359, UAS: 0.9592, LAS: 0.9229, UEM: 0.6352, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2206, partial_loss/deprel_loss: 0.3035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4526, loss: 0.5645, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  61%|######1   | 68/111 [00:47<00:28,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9052, UAS: 0.9587, LAS: 0.9225, UEM: 0.6254, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5371, partial_loss/deprel_loss: 0.5104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6814, loss: 0.5688, batch_reg_loss: 0.1657, reg_loss: 0.1658 ||:  65%|######4   | 72/111 [00:49<00:25,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9586, LAS: 0.9223, UEM: 0.6207, LEM: 0.3927, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5256, partial_loss/deprel_loss: 0.4265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6120, loss: 0.5691, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  68%|######8   | 76/111 [00:52<00:23,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9587, LAS: 0.9223, UEM: 0.6193, LEM: 0.3889, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1841, partial_loss/deprel_loss: 0.3153, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4547, loss: 0.5685, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  72%|#######2  | 80/111 [00:55<00:22,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9590, LAS: 0.9226, UEM: 0.6208, LEM: 0.3900, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2910, partial_loss/deprel_loss: 0.3747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.5656, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  75%|#######4  | 83/111 [00:58<00:20,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9009, UAS: 0.9588, LAS: 0.9222, UEM: 0.6164, LEM: 0.3852, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5515, partial_loss/deprel_loss: 0.5246, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6956, loss: 0.5683, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  77%|#######7  | 86/111 [01:00<00:17,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9583, LAS: 0.9218, UEM: 0.6130, LEM: 0.3822, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2468, partial_loss/deprel_loss: 0.3473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4928, loss: 0.5711, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  80%|########  | 89/111 [01:02<00:15,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9588, LAS: 0.9224, UEM: 0.6181, LEM: 0.3849, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1722, partial_loss/deprel_loss: 0.2980, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4384, loss: 0.5672, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  84%|########3 | 93/111 [01:04<00:12,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9594, LAS: 0.9231, UEM: 0.6311, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0772, partial_loss/deprel_loss: 0.2163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3541, loss: 0.5627, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  88%|########8 | 98/111 [01:07<00:08,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9593, LAS: 0.9232, UEM: 0.6285, LEM: 0.3972, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6855, partial_loss/deprel_loss: 0.4708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6793, loss: 0.5622, batch_reg_loss: 0.1656, reg_loss: 0.1657 ||:  93%|#########2| 103/111 [01:09<00:04,  1.76it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9589, LAS: 0.9229, UEM: 0.6367, LEM: 0.4134, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4590, partial_loss/deprel_loss: 0.4846, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6451, loss: 0.5652, batch_reg_loss: 0.1655, reg_loss: 0.1657 ||:  96%|#########6| 107/111 [01:11<00:02,  1.76it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9590, LAS: 0.9230, UEM: 0.6388, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6903, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7086, loss: 0.5640, batch_reg_loss: 0.1655, reg_loss: 0.1657 ||: 100%|##########| 111/111 [01:14<00:00,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9590, LAS: 0.9230, UEM: 0.6388, LEM: 0.4147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6903, partial_loss/deprel_loss: 0.5063, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7086, loss: 0.5640, batch_reg_loss: 0.1655, reg_loss: 0.1657 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.506  |       N/A\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.690  |       N/A\n",
      "2023-04-07 01:15:32,908 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.166  |       N/A\n",
      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - UEM                      |     0.639  |       N/A\n",
      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - LAS                      |     0.923  |       N/A\n",
      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - loss                     |     0.564  |       N/A\n",
      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - LEM                      |     0.415  |       N/A\n",
      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - EM                       |     0.907  |       N/A\n",
      "2023-04-07 01:15:32,909 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:15:32,914 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:15:37,937 - INFO - combo.training.trainer - Epoch duration: 0:01:23.032082\n",
      "2023-04-07 01:15:37,938 - INFO - combo.training.trainer - Estimated training time remaining: 6:39:22\n",
      "2023-04-07 01:15:37,938 - INFO - allennlp.training.trainer - Epoch 107/399\n",
      "2023-04-07 01:15:37,938 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:15:37,939 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:15:37,951 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9063, UAS: 0.9404, LAS: 0.9045, UEM: 0.1818, LEM: 0.0670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6183, partial_loss/deprel_loss: 0.4834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.7128, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9551, LAS: 0.9217, UEM: 0.7477, LEM: 0.6220, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2309, partial_loss/deprel_loss: 0.3238, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4707, loss: 0.5912, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:   5%|5         | 6/111 [00:04<01:20,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9598, LAS: 0.9264, UEM: 0.7318, LEM: 0.5729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.3944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5294, loss: 0.5564, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:   8%|8         | 9/111 [00:06<01:16,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9556, UAS: 0.9638, LAS: 0.9295, UEM: 0.7680, LEM: 0.5838, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0983, partial_loss/deprel_loss: 0.1903, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3374, loss: 0.5257, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  11%|#         | 12/111 [00:09<01:14,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9645, LAS: 0.9301, UEM: 0.7532, LEM: 0.5563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2345, partial_loss/deprel_loss: 0.3621, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5021, loss: 0.5165, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  14%|#4        | 16/111 [00:12<01:10,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8812, UAS: 0.9611, LAS: 0.9260, UEM: 0.7304, LEM: 0.5306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0098, partial_loss/deprel_loss: 0.6083, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8541, loss: 0.5462, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  17%|#7        | 19/111 [00:14<01:07,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8918, UAS: 0.9604, LAS: 0.9254, UEM: 0.7239, LEM: 0.5191, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9762, partial_loss/deprel_loss: 0.5604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8090, loss: 0.5532, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  20%|#9        | 22/111 [00:16<01:06,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9597, LAS: 0.9250, UEM: 0.7145, LEM: 0.5123, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6173, partial_loss/deprel_loss: 0.4916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6822, loss: 0.5542, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  23%|##2       | 25/111 [00:18<01:03,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9588, LAS: 0.9239, UEM: 0.6825, LEM: 0.4837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4539, partial_loss/deprel_loss: 0.4544, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.5627, batch_reg_loss: 0.1655, reg_loss: 0.1655 ||:  26%|##6       | 29/111 [00:21<00:58,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8950, UAS: 0.9579, LAS: 0.9230, UEM: 0.6704, LEM: 0.4709, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8390, partial_loss/deprel_loss: 0.5060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7380, loss: 0.5715, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  29%|##8       | 32/111 [00:23<00:55,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9584, LAS: 0.9234, UEM: 0.6645, LEM: 0.4611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3485, partial_loss/deprel_loss: 0.3792, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5385, loss: 0.5686, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  32%|###1      | 35/111 [00:25<00:53,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9089, UAS: 0.9585, LAS: 0.9232, UEM: 0.6623, LEM: 0.4566, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5470, partial_loss/deprel_loss: 0.5001, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6749, loss: 0.5675, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  34%|###4      | 38/111 [00:27<00:50,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9595, LAS: 0.9242, UEM: 0.6705, LEM: 0.4606, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.3462, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4946, loss: 0.5603, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  37%|###6      | 41/111 [00:29<00:49,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9595, LAS: 0.9238, UEM: 0.6617, LEM: 0.4485, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6102, partial_loss/deprel_loss: 0.5191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7027, loss: 0.5607, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  41%|####      | 45/111 [00:32<00:44,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9589, LAS: 0.9233, UEM: 0.6512, LEM: 0.4375, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2744, partial_loss/deprel_loss: 0.3026, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4623, loss: 0.5633, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  44%|####4     | 49/111 [00:34<00:39,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9237, UEM: 0.6471, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3814, partial_loss/deprel_loss: 0.4476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5998, loss: 0.5621, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  48%|####7     | 53/111 [00:36<00:36,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9592, LAS: 0.9237, UEM: 0.6426, LEM: 0.4236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2156, partial_loss/deprel_loss: 0.3679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5028, loss: 0.5612, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  51%|#####1    | 57/111 [00:39<00:34,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9458, UAS: 0.9596, LAS: 0.9240, UEM: 0.6447, LEM: 0.4221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1229, partial_loss/deprel_loss: 0.2915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4231, loss: 0.5587, batch_reg_loss: 0.1654, reg_loss: 0.1655 ||:  55%|#####4    | 61/111 [00:42<00:32,  1.53it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9597, LAS: 0.9239, UEM: 0.6410, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5022, partial_loss/deprel_loss: 0.4624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6357, loss: 0.5594, batch_reg_loss: 0.1654, reg_loss: 0.1654 ||:  59%|#####8    | 65/111 [00:44<00:29,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9529, UAS: 0.9589, LAS: 0.9234, UEM: 0.6424, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1442, partial_loss/deprel_loss: 0.2097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3620, loss: 0.5627, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  62%|######2   | 69/111 [00:47<00:28,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9592, LAS: 0.9236, UEM: 0.6441, LEM: 0.4216, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4032, partial_loss/deprel_loss: 0.4486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6049, loss: 0.5617, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  66%|######5   | 73/111 [00:50<00:25,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9599, LAS: 0.9243, UEM: 0.6642, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0766, partial_loss/deprel_loss: 0.1825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3266, loss: 0.5553, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  70%|#######   | 78/111 [00:52<00:20,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9604, LAS: 0.9248, UEM: 0.6636, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4480, partial_loss/deprel_loss: 0.4697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6306, loss: 0.5532, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  75%|#######4  | 83/111 [00:54<00:15,  1.79it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9605, LAS: 0.9249, UEM: 0.6583, LEM: 0.4353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3688, partial_loss/deprel_loss: 0.3764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5402, loss: 0.5531, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  79%|#######9  | 88/111 [00:57<00:12,  1.87it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9603, LAS: 0.9246, UEM: 0.6530, LEM: 0.4290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.4423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5967, loss: 0.5549, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  83%|########2 | 92/111 [00:59<00:10,  1.81it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9597, LAS: 0.9239, UEM: 0.6455, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6310, partial_loss/deprel_loss: 0.5527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7336, loss: 0.5602, batch_reg_loss: 0.1653, reg_loss: 0.1654 ||:  86%|########6 | 96/111 [01:02<00:08,  1.75it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8789, UAS: 0.9591, LAS: 0.9233, UEM: 0.6407, LEM: 0.4176, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9582, partial_loss/deprel_loss: 0.5912, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8299, loss: 0.5646, batch_reg_loss: 0.1652, reg_loss: 0.1654 ||:  90%|######### | 100/111 [01:04<00:06,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9591, LAS: 0.9231, UEM: 0.6373, LEM: 0.4132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2896, partial_loss/deprel_loss: 0.3896, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5348, loss: 0.5664, batch_reg_loss: 0.1652, reg_loss: 0.1654 ||:  94%|#########3| 104/111 [01:08<00:04,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9592, LAS: 0.9232, UEM: 0.6353, LEM: 0.4108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3564, partial_loss/deprel_loss: 0.4573, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6024, loss: 0.5661, batch_reg_loss: 0.1652, reg_loss: 0.1654 ||:  97%|#########7| 108/111 [01:10<00:02,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9596, LAS: 0.9237, UEM: 0.6431, LEM: 0.4185, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2550, partial_loss/deprel_loss: 0.3154, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.5627, batch_reg_loss: 0.1652, reg_loss: 0.1654 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.315  |       N/A\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.255  |       N/A\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.165  |       N/A\n",
      "2023-04-07 01:16:54,108 - INFO - combo.training.tensorboard_writer - UEM                      |     0.643  |       N/A\n",
      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |       N/A\n",
      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - loss                     |     0.563  |       N/A\n",
      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - LEM                      |     0.419  |       N/A\n",
      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - EM                       |     0.936  |       N/A\n",
      "2023-04-07 01:16:54,109 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:16:54,114 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:16:59,229 - INFO - combo.training.trainer - Epoch duration: 0:01:21.291164\n",
      "2023-04-07 01:16:59,230 - INFO - combo.training.trainer - Estimated training time remaining: 6:37:58\n",
      "2023-04-07 01:16:59,230 - INFO - allennlp.training.trainer - Epoch 108/399\n",
      "2023-04-07 01:16:59,230 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:16:59,230 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:16:59,239 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9553, LAS: 0.9185, UEM: 0.4522, LEM: 0.2261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2684, partial_loss/deprel_loss: 0.3385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4897, loss: 0.6150, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:   3%|2         | 3/111 [00:02<01:15,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8999, UAS: 0.9546, LAS: 0.9193, UEM: 0.4889, LEM: 0.2563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8166, partial_loss/deprel_loss: 0.5060, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7334, loss: 0.6051, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:   5%|5         | 6/111 [00:04<01:15,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9595, LAS: 0.9240, UEM: 0.6025, LEM: 0.3661, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1919, partial_loss/deprel_loss: 0.2749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4235, loss: 0.5659, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:   8%|8         | 9/111 [00:06<01:15,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8859, UAS: 0.9532, LAS: 0.9178, UEM: 0.5312, LEM: 0.3147, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0256, partial_loss/deprel_loss: 0.5718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8277, loss: 0.5976, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  12%|#1        | 13/111 [00:09<01:08,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9536, LAS: 0.9181, UEM: 0.5355, LEM: 0.3208, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2057, partial_loss/deprel_loss: 0.2798, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4302, loss: 0.5954, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  14%|#4        | 16/111 [00:11<01:06,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9538, LAS: 0.9180, UEM: 0.5170, LEM: 0.3018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4307, partial_loss/deprel_loss: 0.3894, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5629, loss: 0.5964, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  17%|#7        | 19/111 [00:13<01:04,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9534, LAS: 0.9171, UEM: 0.5024, LEM: 0.2893, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5278, partial_loss/deprel_loss: 0.4720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6483, loss: 0.5977, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  20%|#9        | 22/111 [00:15<01:01,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9547, LAS: 0.9183, UEM: 0.5345, LEM: 0.3124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6225, partial_loss/deprel_loss: 0.4262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6306, loss: 0.5869, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  23%|##2       | 25/111 [00:17<01:02,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9568, LAS: 0.9208, UEM: 0.5885, LEM: 0.3651, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1603, partial_loss/deprel_loss: 0.2463, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3942, loss: 0.5704, batch_reg_loss: 0.1652, reg_loss: 0.1652 ||:  25%|##5       | 28/111 [00:19<00:59,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8955, UAS: 0.9567, LAS: 0.9207, UEM: 0.5925, LEM: 0.3715, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6408, partial_loss/deprel_loss: 0.6466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8106, loss: 0.5757, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  28%|##7       | 31/111 [00:22<00:59,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9220, UAS: 0.9570, LAS: 0.9211, UEM: 0.5842, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3374, partial_loss/deprel_loss: 0.4541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.5759, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  31%|###       | 34/111 [00:24<00:56,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9073, UAS: 0.9571, LAS: 0.9210, UEM: 0.5775, LEM: 0.3523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5832, partial_loss/deprel_loss: 0.5241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7011, loss: 0.5768, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  33%|###3      | 37/111 [00:26<00:53,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9566, LAS: 0.9205, UEM: 0.5616, LEM: 0.3367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5129, partial_loss/deprel_loss: 0.4416, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6210, loss: 0.5796, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  37%|###6      | 41/111 [00:29<00:48,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8969, UAS: 0.9568, LAS: 0.9208, UEM: 0.5599, LEM: 0.3330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7523, partial_loss/deprel_loss: 0.5404, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7479, loss: 0.5798, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  41%|####      | 45/111 [00:31<00:44,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9573, LAS: 0.9212, UEM: 0.5717, LEM: 0.3448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3370, partial_loss/deprel_loss: 0.3491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5118, loss: 0.5767, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  43%|####3     | 48/111 [00:33<00:43,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9577, LAS: 0.9217, UEM: 0.5806, LEM: 0.3533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.3451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4934, loss: 0.5721, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  46%|####5     | 51/111 [00:35<00:42,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9585, LAS: 0.9226, UEM: 0.6101, LEM: 0.3869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0995, partial_loss/deprel_loss: 0.1774, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3269, loss: 0.5642, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  49%|####8     | 54/111 [00:38<00:40,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8888, UAS: 0.9580, LAS: 0.9222, UEM: 0.6093, LEM: 0.3867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9579, partial_loss/deprel_loss: 0.6240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8558, loss: 0.5683, batch_reg_loss: 0.1651, reg_loss: 0.1652 ||:  51%|#####1    | 57/111 [00:40<00:38,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9593, LAS: 0.9234, UEM: 0.6378, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1566, partial_loss/deprel_loss: 0.2924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4303, loss: 0.5589, batch_reg_loss: 0.1651, reg_loss: 0.1651 ||:  55%|#####4    | 61/111 [00:42<00:33,  1.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9597, LAS: 0.9237, UEM: 0.6403, LEM: 0.4135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2546, partial_loss/deprel_loss: 0.2992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4553, loss: 0.5568, batch_reg_loss: 0.1651, reg_loss: 0.1651 ||:  59%|#####8    | 65/111 [00:44<00:28,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9601, LAS: 0.9239, UEM: 0.6396, LEM: 0.4078, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2857, partial_loss/deprel_loss: 0.3470, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4998, loss: 0.5548, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  63%|######3   | 70/111 [00:46<00:22,  1.79it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9602, LAS: 0.9242, UEM: 0.6355, LEM: 0.4028, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3710, partial_loss/deprel_loss: 0.3691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5345, loss: 0.5529, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  68%|######7   | 75/111 [00:49<00:19,  1.84it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9609, LAS: 0.9247, UEM: 0.6496, LEM: 0.4167, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2679, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4851, loss: 0.5488, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  71%|#######1  | 79/111 [00:51<00:18,  1.72it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9605, LAS: 0.9245, UEM: 0.6596, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6113, partial_loss/deprel_loss: 0.5152, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6994, loss: 0.5509, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  75%|#######4  | 83/111 [00:55<00:18,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9111, UAS: 0.9602, LAS: 0.9244, UEM: 0.6551, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4968, partial_loss/deprel_loss: 0.4183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5990, loss: 0.5509, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  78%|#######8  | 87/111 [00:58<00:16,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9606, LAS: 0.9248, UEM: 0.6565, LEM: 0.4329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4187, partial_loss/deprel_loss: 0.3940, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5639, loss: 0.5483, batch_reg_loss: 0.1650, reg_loss: 0.1651 ||:  82%|########1 | 91/111 [01:00<00:13,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9067, UAS: 0.9600, LAS: 0.9242, UEM: 0.6535, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6841, partial_loss/deprel_loss: 0.4818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6872, loss: 0.5532, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||:  86%|########5 | 95/111 [01:03<00:10,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9598, LAS: 0.9239, UEM: 0.6465, LEM: 0.4221, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3786, partial_loss/deprel_loss: 0.4065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5658, loss: 0.5551, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||:  89%|########9 | 99/111 [01:05<00:07,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9596, LAS: 0.9238, UEM: 0.6435, LEM: 0.4186, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3555, partial_loss/deprel_loss: 0.3684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5308, loss: 0.5557, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||:  93%|#########2| 103/111 [01:08<00:05,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9041, UAS: 0.9592, LAS: 0.9235, UEM: 0.6426, LEM: 0.4184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8306, partial_loss/deprel_loss: 0.4825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7170, loss: 0.5577, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||:  96%|#########6| 107/111 [01:11<00:02,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9237, UEM: 0.6404, LEM: 0.4160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4690, partial_loss/deprel_loss: 0.4414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.5582, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9593, LAS: 0.9237, UEM: 0.6404, LEM: 0.4160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4690, partial_loss/deprel_loss: 0.4414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6118, loss: 0.5582, batch_reg_loss: 0.1649, reg_loss: 0.1651 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
      "2023-04-07 01:18:15,970 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.441  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.469  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.165  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - UEM                      |     0.640  |       N/A\n",
      "2023-04-07 01:18:15,971 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |       N/A\n",
      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - loss                     |     0.558  |       N/A\n",
      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - LEM                      |     0.416  |       N/A\n",
      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - EM                       |     0.922  |       N/A\n",
      "2023-04-07 01:18:15,972 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:18:15,977 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:18:20,504 - INFO - combo.training.trainer - Epoch duration: 0:01:21.274289\n",
      "2023-04-07 01:18:20,504 - INFO - combo.training.trainer - Estimated training time remaining: 6:36:35\n",
      "2023-04-07 01:18:20,505 - INFO - allennlp.training.trainer - Epoch 109/399\n",
      "2023-04-07 01:18:20,505 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:18:20,505 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:18:20,511 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9593, LAS: 0.9236, UEM: 0.6521, LEM: 0.4525, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5284, partial_loss/deprel_loss: 0.4916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6639, loss: 0.5311, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||:   3%|2         | 3/111 [00:02<01:20,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9639, LAS: 0.9292, UEM: 0.6776, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0727, partial_loss/deprel_loss: 0.2414, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3725, loss: 0.5108, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||:   6%|6         | 7/111 [00:04<01:13,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9647, LAS: 0.9301, UEM: 0.7206, LEM: 0.5242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5017, partial_loss/deprel_loss: 0.4443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6206, loss: 0.4998, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||:   9%|9         | 10/111 [00:07<01:13,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9639, LAS: 0.9291, UEM: 0.6909, LEM: 0.4869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2603, partial_loss/deprel_loss: 0.3373, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4868, loss: 0.5078, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||:  12%|#1        | 13/111 [00:09<01:09,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9650, LAS: 0.9297, UEM: 0.7081, LEM: 0.4977, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1774, partial_loss/deprel_loss: 0.3130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4507, loss: 0.5012, batch_reg_loss: 0.1649, reg_loss: 0.1649 ||:  14%|#4        | 16/111 [00:11<01:09,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9652, LAS: 0.9295, UEM: 0.7043, LEM: 0.4836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1694, partial_loss/deprel_loss: 0.2815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4240, loss: 0.5025, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||:  17%|#7        | 19/111 [00:13<01:06,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9268, UAS: 0.9654, LAS: 0.9295, UEM: 0.6904, LEM: 0.4650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2851, partial_loss/deprel_loss: 0.3708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5185, loss: 0.5048, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||:  20%|#9        | 22/111 [00:15<01:04,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9639, LAS: 0.9277, UEM: 0.6742, LEM: 0.4469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6014, partial_loss/deprel_loss: 0.5016, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6864, loss: 0.5192, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||:  23%|##3       | 26/111 [00:18<00:59,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8808, UAS: 0.9629, LAS: 0.9264, UEM: 0.6690, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9460, partial_loss/deprel_loss: 0.6749, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8939, loss: 0.5308, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||:  26%|##6       | 29/111 [00:20<00:57,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9076, UAS: 0.9615, LAS: 0.9251, UEM: 0.6499, LEM: 0.4218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6377, partial_loss/deprel_loss: 0.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6759, loss: 0.5409, batch_reg_loss: 0.1648, reg_loss: 0.1649 ||:  29%|##8       | 32/111 [00:22<00:57,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9618, LAS: 0.9255, UEM: 0.6579, LEM: 0.4286, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1913, partial_loss/deprel_loss: 0.2937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4380, loss: 0.5392, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||:  32%|###1      | 35/111 [00:24<00:54,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9622, LAS: 0.9256, UEM: 0.6576, LEM: 0.4232, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2549, partial_loss/deprel_loss: 0.3702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5119, loss: 0.5392, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||:  35%|###5      | 39/111 [00:27<00:49,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9624, LAS: 0.9262, UEM: 0.6782, LEM: 0.4593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6272, partial_loss/deprel_loss: 0.4519, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6517, loss: 0.5356, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||:  38%|###7      | 42/111 [00:29<00:50,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9618, LAS: 0.9259, UEM: 0.6666, LEM: 0.4473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6933, partial_loss/deprel_loss: 0.4629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6737, loss: 0.5404, batch_reg_loss: 0.1648, reg_loss: 0.1648 ||:  42%|####2     | 47/111 [00:32<00:42,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9612, LAS: 0.9255, UEM: 0.6695, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2173, partial_loss/deprel_loss: 0.2628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4185, loss: 0.5427, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  46%|####5     | 51/111 [00:35<00:40,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9617, LAS: 0.9261, UEM: 0.6680, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2944, partial_loss/deprel_loss: 0.3405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4960, loss: 0.5398, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  50%|####9     | 55/111 [00:37<00:35,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9620, LAS: 0.9264, UEM: 0.6709, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2472, partial_loss/deprel_loss: 0.2889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4453, loss: 0.5356, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  53%|#####3    | 59/111 [00:40<00:34,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9621, LAS: 0.9265, UEM: 0.6713, LEM: 0.4464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3059, partial_loss/deprel_loss: 0.3606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.5340, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  57%|#####6    | 63/111 [00:43<00:32,  1.47it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9622, LAS: 0.9267, UEM: 0.6706, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1655, partial_loss/deprel_loss: 0.2805, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4222, loss: 0.5326, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  60%|######    | 67/111 [00:45<00:28,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9617, LAS: 0.9261, UEM: 0.6613, LEM: 0.4347, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2136, partial_loss/deprel_loss: 0.3104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4557, loss: 0.5385, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  65%|######4   | 72/111 [00:47<00:23,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9610, LAS: 0.9255, UEM: 0.6554, LEM: 0.4301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6497, partial_loss/deprel_loss: 0.4840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6818, loss: 0.5429, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  68%|######8   | 76/111 [00:50<00:21,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9607, LAS: 0.9252, UEM: 0.6508, LEM: 0.4250, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2026, partial_loss/deprel_loss: 0.3609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4939, loss: 0.5461, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  72%|#######2  | 80/111 [00:52<00:18,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9607, LAS: 0.9251, UEM: 0.6457, LEM: 0.4202, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2719, partial_loss/deprel_loss: 0.3363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4881, loss: 0.5473, batch_reg_loss: 0.1647, reg_loss: 0.1648 ||:  76%|#######5  | 84/111 [00:55<00:16,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8811, UAS: 0.9606, LAS: 0.9251, UEM: 0.6512, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0141, partial_loss/deprel_loss: 0.6056, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8519, loss: 0.5472, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9607, LAS: 0.9251, UEM: 0.6511, LEM: 0.4258, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2974, partial_loss/deprel_loss: 0.3590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5113, loss: 0.5471, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||:  83%|########2 | 92/111 [01:00<00:12,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9512, UAS: 0.9605, LAS: 0.9250, UEM: 0.6587, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0870, partial_loss/deprel_loss: 0.2240, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3612, loss: 0.5474, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||:  86%|########6 | 96/111 [01:03<00:10,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9105, UAS: 0.9600, LAS: 0.9245, UEM: 0.6535, LEM: 0.4318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6137, partial_loss/deprel_loss: 0.4769, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6689, loss: 0.5521, batch_reg_loss: 0.1646, reg_loss: 0.1648 ||:  90%|######### | 100/111 [01:06<00:07,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9596, LAS: 0.9239, UEM: 0.6484, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4753, partial_loss/deprel_loss: 0.4882, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6502, loss: 0.5571, batch_reg_loss: 0.1646, reg_loss: 0.1647 ||:  94%|#########3| 104/111 [01:08<00:04,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9596, LAS: 0.9239, UEM: 0.6458, LEM: 0.4228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2564, partial_loss/deprel_loss: 0.3385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4867, loss: 0.5568, batch_reg_loss: 0.1646, reg_loss: 0.1647 ||:  97%|#########7| 108/111 [01:11<00:01,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9596, LAS: 0.9238, UEM: 0.6435, LEM: 0.4200, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2266, partial_loss/deprel_loss: 0.3723, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5078, loss: 0.5579, batch_reg_loss: 0.1646, reg_loss: 0.1647 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.372  |       N/A\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.227  |       N/A\n",
      "2023-04-07 01:19:36,947 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.165  |       N/A\n",
      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - UEM                      |     0.643  |       N/A\n",
      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |       N/A\n",
      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - loss                     |     0.558  |       N/A\n",
      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - LEM                      |     0.420  |       N/A\n",
      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - EM                       |     0.929  |       N/A\n",
      "2023-04-07 01:19:36,948 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:19:36,953 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:19:41,588 - INFO - combo.training.trainer - Epoch duration: 0:01:21.083316\n",
      "2023-04-07 01:19:41,588 - INFO - combo.training.trainer - Estimated training time remaining: 6:35:12\n",
      "2023-04-07 01:19:41,589 - INFO - allennlp.training.trainer - Epoch 110/399\n",
      "2023-04-07 01:19:41,589 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:19:41,589 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:19:41,614 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9717, LAS: 0.9407, UEM: 0.8579, LEM: 0.7503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4825, partial_loss/deprel_loss: 0.4682, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6356, loss: 0.4710, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||:   3%|2         | 3/111 [00:02<01:23,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9648, LAS: 0.9312, UEM: 0.7607, LEM: 0.6095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2430, partial_loss/deprel_loss: 0.3122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4630, loss: 0.5286, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||:   5%|5         | 6/111 [00:04<01:19,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9070, UAS: 0.9631, LAS: 0.9301, UEM: 0.7603, LEM: 0.6183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5614, partial_loss/deprel_loss: 0.5790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7401, loss: 0.5314, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||:   8%|8         | 9/111 [00:06<01:16,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9338, UAS: 0.9626, LAS: 0.9295, UEM: 0.7216, LEM: 0.5597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1972, partial_loss/deprel_loss: 0.3086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4509, loss: 0.5329, batch_reg_loss: 0.1646, reg_loss: 0.1646 ||:  11%|#         | 12/111 [00:08<01:14,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9602, LAS: 0.9259, UEM: 0.6921, LEM: 0.5212, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3618, partial_loss/deprel_loss: 0.4305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5813, loss: 0.5588, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||:  14%|#3        | 15/111 [00:10<01:09,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9605, LAS: 0.9263, UEM: 0.6697, LEM: 0.4844, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3103, partial_loss/deprel_loss: 0.3685, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5214, loss: 0.5584, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||:  17%|#7        | 19/111 [00:13<01:03,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9598, LAS: 0.9255, UEM: 0.6550, LEM: 0.4644, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1687, partial_loss/deprel_loss: 0.3197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4541, loss: 0.5648, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||:  20%|#9        | 22/111 [00:15<01:03,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9106, UAS: 0.9586, LAS: 0.9242, UEM: 0.6355, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5601, partial_loss/deprel_loss: 0.4628, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6468, loss: 0.5702, batch_reg_loss: 0.1645, reg_loss: 0.1646 ||:  23%|##3       | 26/111 [00:18<00:58,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9580, LAS: 0.9236, UEM: 0.6279, LEM: 0.4288, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2239, partial_loss/deprel_loss: 0.3454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4856, loss: 0.5715, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  27%|##7       | 30/111 [00:21<00:55,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9576, LAS: 0.9234, UEM: 0.6131, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6178, partial_loss/deprel_loss: 0.5330, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7145, loss: 0.5735, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  30%|##9       | 33/111 [00:23<00:55,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9568, LAS: 0.9225, UEM: 0.6158, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2690, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5064, loss: 0.5788, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  32%|###2      | 36/111 [00:25<00:53,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9568, LAS: 0.9225, UEM: 0.6259, LEM: 0.4195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0041, partial_loss/deprel_loss: 0.5339, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7924, loss: 0.5774, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  35%|###5      | 39/111 [00:27<00:53,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9555, LAS: 0.9210, UEM: 0.6101, LEM: 0.4044, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8748, partial_loss/deprel_loss: 0.6011, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8203, loss: 0.5890, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  39%|###8      | 43/111 [00:30<00:48,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9099, UAS: 0.9556, LAS: 0.9212, UEM: 0.5979, LEM: 0.3897, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5680, partial_loss/deprel_loss: 0.4212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6151, loss: 0.5863, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  43%|####3     | 48/111 [00:32<00:39,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9562, LAS: 0.9215, UEM: 0.6145, LEM: 0.4018, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0934, partial_loss/deprel_loss: 0.2977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4213, loss: 0.5821, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  48%|####7     | 53/111 [00:34<00:33,  1.74it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9171, UAS: 0.9565, LAS: 0.9217, UEM: 0.6144, LEM: 0.3993, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4778, partial_loss/deprel_loss: 0.4093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5875, loss: 0.5790, batch_reg_loss: 0.1645, reg_loss: 0.1645 ||:  51%|#####1    | 57/111 [00:36<00:30,  1.80it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9412, UAS: 0.9562, LAS: 0.9214, UEM: 0.6066, LEM: 0.3921, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2144, partial_loss/deprel_loss: 0.3356, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4758, loss: 0.5818, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  55%|#####4    | 61/111 [00:38<00:27,  1.84it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9565, LAS: 0.9219, UEM: 0.6104, LEM: 0.3969, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3077, partial_loss/deprel_loss: 0.3634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5167, loss: 0.5782, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  59%|#####8    | 65/111 [00:42<00:28,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9564, LAS: 0.9217, UEM: 0.6083, LEM: 0.3928, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3418, partial_loss/deprel_loss: 0.3516, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.5789, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  62%|######2   | 69/111 [00:44<00:26,  1.58it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9572, LAS: 0.9223, UEM: 0.6156, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4749, partial_loss/deprel_loss: 0.4711, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6363, loss: 0.5745, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  66%|######5   | 73/111 [00:47<00:25,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9575, LAS: 0.9226, UEM: 0.6203, LEM: 0.3998, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1145, partial_loss/deprel_loss: 0.2285, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3701, loss: 0.5720, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  69%|######9   | 77/111 [00:50<00:23,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9135, UAS: 0.9575, LAS: 0.9225, UEM: 0.6175, LEM: 0.3945, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5904, partial_loss/deprel_loss: 0.4982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6810, loss: 0.5731, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  73%|#######2  | 81/111 [00:53<00:21,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9576, LAS: 0.9226, UEM: 0.6186, LEM: 0.3954, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3328, partial_loss/deprel_loss: 0.4035, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.5720, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  76%|#######5  | 84/111 [00:56<00:19,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9580, LAS: 0.9229, UEM: 0.6180, LEM: 0.3933, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3493, partial_loss/deprel_loss: 0.4093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5617, loss: 0.5701, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  78%|#######8  | 87/111 [00:58<00:17,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9583, LAS: 0.9233, UEM: 0.6233, LEM: 0.3994, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1383, partial_loss/deprel_loss: 0.2481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3905, loss: 0.5673, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  81%|########1 | 90/111 [01:00<00:15,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9585, LAS: 0.9235, UEM: 0.6321, LEM: 0.4094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6988, partial_loss/deprel_loss: 0.4598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6720, loss: 0.5650, batch_reg_loss: 0.1644, reg_loss: 0.1645 ||:  84%|########3 | 93/111 [01:02<00:13,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9585, LAS: 0.9234, UEM: 0.6279, LEM: 0.4046, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3920, partial_loss/deprel_loss: 0.4626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6129, loss: 0.5658, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||:  86%|########6 | 96/111 [01:05<00:11,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9586, LAS: 0.9236, UEM: 0.6319, LEM: 0.4104, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6267, partial_loss/deprel_loss: 0.4552, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6539, loss: 0.5635, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||:  89%|########9 | 99/111 [01:07<00:08,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9590, LAS: 0.9239, UEM: 0.6369, LEM: 0.4143, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3991, partial_loss/deprel_loss: 0.4368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5936, loss: 0.5613, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||:  92%|#########1| 102/111 [01:09<00:06,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9594, LAS: 0.9242, UEM: 0.6422, LEM: 0.4173, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3173, partial_loss/deprel_loss: 0.3599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5157, loss: 0.5582, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||:  95%|#########4| 105/111 [01:12<00:04,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9597, LAS: 0.9245, UEM: 0.6444, LEM: 0.4182, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1521, partial_loss/deprel_loss: 0.2242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3741, loss: 0.5558, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||:  97%|#########7| 108/111 [01:14<00:02,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9596, LAS: 0.9243, UEM: 0.6463, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2799, partial_loss/deprel_loss: 0.3418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4937, loss: 0.5562, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||: 100%|##########| 111/111 [01:16<00:00,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9596, LAS: 0.9243, UEM: 0.6463, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2799, partial_loss/deprel_loss: 0.3418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4937, loss: 0.5562, batch_reg_loss: 0.1643, reg_loss: 0.1645 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
      "2023-04-07 01:21:01,093 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9641, LAS: 0.9129, UEM: 0.7128, LEM: 0.3718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3735, partial_loss/deprel_loss: 25.4464, partial_loss/cycle_loss: 0.0000, batch_loss: 20.4318, loss: 19.6309, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:11,  1.04s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9636, LAS: 0.9138, UEM: 0.7601, LEM: 0.4905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1781, partial_loss/deprel_loss: 18.1071, partial_loss/cycle_loss: 0.0000, batch_loss: 14.5213, loss: 19.2017, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:04<00:08,  1.02s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8781, UAS: 0.9509, LAS: 0.9007, UEM: 0.7007, LEM: 0.4404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1098, partial_loss/deprel_loss: 41.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 33.2512, loss: 23.2837, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:08<00:05,  1.02s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8705, UAS: 0.9466, LAS: 0.8952, UEM: 0.6532, LEM: 0.3988, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3394, partial_loss/deprel_loss: 45.8758, partial_loss/cycle_loss: 0.0000, batch_loss: 36.9685, loss: 25.1615, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  77%|#######6  | 10/13 [00:10<00:03,  1.01s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9476, LAS: 0.8970, UEM: 0.6576, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8956, partial_loss/deprel_loss: 29.6791, partial_loss/cycle_loss: 0.0000, batch_loss: 23.9224, loss: 24.6363, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9476, LAS: 0.8970, UEM: 0.6576, LEM: 0.3971, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8956, partial_loss/deprel_loss: 29.6791, partial_loss/cycle_loss: 0.0000, batch_loss: 23.9224, loss: 24.6363, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
      "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:21:13,721 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - patience                 |     6.000  |       N/A\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.342  |    29.679\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.280  |     0.896\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.164  |     0.000\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - UEM                      |     0.646  |     0.658\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |     0.897\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - loss                     |     0.556  |    24.636\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - LEM                      |     0.419  |     0.397\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:21:13,722 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |     0.948\n",
      "2023-04-07 01:21:13,723 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:21:13,723 - INFO - combo.training.tensorboard_writer - EM                       |     0.934  |     0.881\n",
      "2023-04-07 01:21:13,723 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:21:13,728 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:21:18,618 - INFO - combo.training.trainer - Epoch duration: 0:01:37.029658\n",
      "2023-04-07 01:21:18,619 - INFO - combo.training.trainer - Estimated training time remaining: 6:34:30\n",
      "2023-04-07 01:21:18,619 - INFO - allennlp.training.trainer - Epoch 111/399\n",
      "2023-04-07 01:21:18,619 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:21:18,619 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:21:18,627 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9351, UAS: 0.9556, LAS: 0.9218, UEM: 0.4730, LEM: 0.2527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2893, partial_loss/deprel_loss: 0.2881, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4526, loss: 0.5829, batch_reg_loss: 0.1643, reg_loss: 0.1643 ||:   4%|3         | 4/111 [00:02<01:09,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9574, LAS: 0.9235, UEM: 0.4780, LEM: 0.2599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3950, partial_loss/deprel_loss: 0.3992, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5627, loss: 0.5757, batch_reg_loss: 0.1643, reg_loss: 0.1643 ||:   7%|7         | 8/111 [00:04<01:03,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9598, LAS: 0.9249, UEM: 0.5409, LEM: 0.3060, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2755, partial_loss/deprel_loss: 0.3663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.5598, batch_reg_loss: 0.1643, reg_loss: 0.1643 ||:  12%|#1        | 13/111 [00:06<00:55,  1.78it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9476, UAS: 0.9620, LAS: 0.9272, UEM: 0.6094, LEM: 0.3869, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1368, partial_loss/deprel_loss: 0.2402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3838, loss: 0.5370, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||:  16%|#6        | 18/111 [00:09<00:48,  1.90it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9626, LAS: 0.9280, UEM: 0.6157, LEM: 0.3911, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3550, partial_loss/deprel_loss: 0.3964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5523, loss: 0.5314, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||:  20%|#9        | 22/111 [00:11<00:46,  1.91it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9647, LAS: 0.9304, UEM: 0.6799, LEM: 0.4691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3518, partial_loss/deprel_loss: 0.3935, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5494, loss: 0.5178, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||:  23%|##3       | 26/111 [00:14<00:49,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9448, UAS: 0.9639, LAS: 0.9299, UEM: 0.6849, LEM: 0.4770, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1500, partial_loss/deprel_loss: 0.2611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4031, loss: 0.5199, batch_reg_loss: 0.1642, reg_loss: 0.1643 ||:  27%|##7       | 30/111 [00:17<00:53,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9635, LAS: 0.9297, UEM: 0.7096, LEM: 0.5093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1431, partial_loss/deprel_loss: 0.2757, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4134, loss: 0.5201, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  30%|##9       | 33/111 [00:19<00:54,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9038, UAS: 0.9603, LAS: 0.9262, UEM: 0.6885, LEM: 0.4912, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6263, partial_loss/deprel_loss: 0.5303, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7137, loss: 0.5447, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  33%|###3      | 37/111 [00:22<00:49,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9603, LAS: 0.9262, UEM: 0.6803, LEM: 0.4802, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4154, partial_loss/deprel_loss: 0.4471, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6050, loss: 0.5469, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  37%|###6      | 41/111 [00:24<00:44,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9592, LAS: 0.9249, UEM: 0.6709, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1996, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4706, loss: 0.5541, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  41%|####      | 45/111 [00:27<00:43,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8997, UAS: 0.9580, LAS: 0.9238, UEM: 0.6687, LEM: 0.4696, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8114, partial_loss/deprel_loss: 0.4566, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6917, loss: 0.5602, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  44%|####4     | 49/111 [00:30<00:41,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9098, UAS: 0.9581, LAS: 0.9238, UEM: 0.6645, LEM: 0.4654, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5992, partial_loss/deprel_loss: 0.4125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6140, loss: 0.5593, batch_reg_loss: 0.1642, reg_loss: 0.1642 ||:  48%|####7     | 53/111 [00:33<00:40,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9589, LAS: 0.9246, UEM: 0.6702, LEM: 0.4658, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1928, partial_loss/deprel_loss: 0.3195, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4583, loss: 0.5533, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  50%|#####     | 56/111 [00:35<00:40,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9589, LAS: 0.9245, UEM: 0.6632, LEM: 0.4577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5083, partial_loss/deprel_loss: 0.4816, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6511, loss: 0.5547, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  53%|#####3    | 59/111 [00:37<00:37,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9591, LAS: 0.9245, UEM: 0.6607, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3761, partial_loss/deprel_loss: 0.4201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5754, loss: 0.5543, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  56%|#####5    | 62/111 [00:39<00:35,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9596, LAS: 0.9248, UEM: 0.6674, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2814, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4760, loss: 0.5503, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  59%|#####8    | 65/111 [00:41<00:33,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9597, LAS: 0.9248, UEM: 0.6682, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1707, partial_loss/deprel_loss: 0.2553, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4025, loss: 0.5495, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  61%|######1   | 68/111 [00:44<00:31,  1.35it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9599, LAS: 0.9250, UEM: 0.6684, LEM: 0.4601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1683, partial_loss/deprel_loss: 0.2533, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4004, loss: 0.5474, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  64%|######3   | 71/111 [00:46<00:29,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9600, LAS: 0.9251, UEM: 0.6631, LEM: 0.4524, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.3692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5171, loss: 0.5473, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  68%|######7   | 75/111 [00:48<00:24,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9592, LAS: 0.9241, UEM: 0.6583, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2128, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4905, loss: 0.5534, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  70%|#######   | 78/111 [00:51<00:23,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9593, LAS: 0.9240, UEM: 0.6555, LEM: 0.4427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4426, partial_loss/deprel_loss: 0.4539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6158, loss: 0.5546, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  73%|#######2  | 81/111 [00:53<00:21,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9593, LAS: 0.9240, UEM: 0.6541, LEM: 0.4401, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1507, partial_loss/deprel_loss: 0.2648, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4060, loss: 0.5554, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  76%|#######5  | 84/111 [00:55<00:19,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9591, LAS: 0.9238, UEM: 0.6509, LEM: 0.4369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1896, partial_loss/deprel_loss: 0.2569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4075, loss: 0.5566, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  78%|#######8  | 87/111 [00:57<00:17,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9595, LAS: 0.9241, UEM: 0.6525, LEM: 0.4357, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2041, partial_loss/deprel_loss: 0.2996, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4446, loss: 0.5538, batch_reg_loss: 0.1641, reg_loss: 0.1642 ||:  81%|########1 | 90/111 [00:59<00:15,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9597, LAS: 0.9243, UEM: 0.6539, LEM: 0.4352, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3412, partial_loss/deprel_loss: 0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5503, loss: 0.5519, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||:  85%|########4 | 94/111 [01:02<00:11,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9600, LAS: 0.9247, UEM: 0.6560, LEM: 0.4365, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2771, partial_loss/deprel_loss: 0.3875, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5294, loss: 0.5495, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||:  87%|########7 | 97/111 [01:04<00:09,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9596, LAS: 0.9243, UEM: 0.6499, LEM: 0.4312, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3014, partial_loss/deprel_loss: 0.3095, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4719, loss: 0.5512, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||:  91%|######### | 101/111 [01:09<00:08,  1.13it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9594, LAS: 0.9240, UEM: 0.6432, LEM: 0.4241, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4741, partial_loss/deprel_loss: 0.5343, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6863, loss: 0.5547, batch_reg_loss: 0.1640, reg_loss: 0.1642 ||:  95%|#########4| 105/111 [01:12<00:04,  1.25it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9597, LAS: 0.9244, UEM: 0.6477, LEM: 0.4275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2616, partial_loss/deprel_loss: 0.3654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5086, loss: 0.5519, batch_reg_loss: 0.1640, reg_loss: 0.1641 ||:  97%|#########7| 108/111 [01:14<00:02,  1.24it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9595, LAS: 0.9241, UEM: 0.6436, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3721, partial_loss/deprel_loss: 0.3770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5400, loss: 0.5536, batch_reg_loss: 0.1640, reg_loss: 0.1641 ||: 100%|##########| 111/111 [01:16<00:00,  1.45it/s]\n",
      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:22:38,115 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.377  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.372  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.164  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - UEM                      |     0.644  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - LAS                      |     0.924  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - loss                     |     0.554  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - LEM                      |     0.423  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - UAS                      |     0.959  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - EM                       |     0.922  |       N/A\n",
      "2023-04-07 01:22:38,116 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:22:38,121 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:22:45,590 - INFO - combo.training.trainer - Epoch duration: 0:01:26.971396\n",
      "2023-04-07 01:22:45,591 - INFO - combo.training.trainer - Estimated training time remaining: 6:33:21\n",
      "2023-04-07 01:22:45,591 - INFO - allennlp.training.trainer - Epoch 112/399\n",
      "2023-04-07 01:22:45,591 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:22:45,592 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:22:45,602 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8898, UAS: 0.9465, LAS: 0.9113, UEM: 0.3516, LEM: 0.1868, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9347, partial_loss/deprel_loss: 0.5649, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8029, loss: 0.6429, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:   3%|2         | 3/111 [00:02<01:18,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8976, UAS: 0.9502, LAS: 0.9139, UEM: 0.4979, LEM: 0.3100, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7785, partial_loss/deprel_loss: 0.5310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7445, loss: 0.6125, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:   5%|5         | 6/111 [00:04<01:16,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9543, LAS: 0.9171, UEM: 0.5289, LEM: 0.2964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2015, partial_loss/deprel_loss: 0.3542, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4876, loss: 0.5984, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:   9%|9         | 10/111 [00:06<01:10,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9520, LAS: 0.9153, UEM: 0.4784, LEM: 0.2608, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3941, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5947, loss: 0.6202, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:  13%|#2        | 14/111 [00:09<01:06,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9388, UAS: 0.9533, LAS: 0.9172, UEM: 0.5065, LEM: 0.2880, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1862, partial_loss/deprel_loss: 0.3066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4465, loss: 0.6082, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:  16%|#6        | 18/111 [00:12<01:03,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8858, UAS: 0.9527, LAS: 0.9165, UEM: 0.5070, LEM: 0.2859, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8457, partial_loss/deprel_loss: 0.5729, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7914, loss: 0.6121, batch_reg_loss: 0.1640, reg_loss: 0.1640 ||:  19%|#8        | 21/111 [00:14<01:04,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9252, UAS: 0.9537, LAS: 0.9181, UEM: 0.5409, LEM: 0.3272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3244, partial_loss/deprel_loss: 0.3309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4936, loss: 0.6005, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  22%|##1       | 24/111 [00:16<01:03,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9403, UAS: 0.9540, LAS: 0.9189, UEM: 0.5440, LEM: 0.3287, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3007, partial_loss/deprel_loss: 0.2811, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4490, loss: 0.5944, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  24%|##4       | 27/111 [00:19<01:01,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9564, LAS: 0.9210, UEM: 0.5942, LEM: 0.3711, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1901, partial_loss/deprel_loss: 0.2766, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4233, loss: 0.5804, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  27%|##7       | 30/111 [00:21<00:58,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9571, LAS: 0.9218, UEM: 0.6062, LEM: 0.3837, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4590, partial_loss/deprel_loss: 0.4322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6015, loss: 0.5729, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  30%|##9       | 33/111 [00:23<00:56,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9579, LAS: 0.9227, UEM: 0.6108, LEM: 0.3877, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2158, partial_loss/deprel_loss: 0.2707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4236, loss: 0.5635, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  33%|###3      | 37/111 [00:25<00:51,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9576, LAS: 0.9225, UEM: 0.6093, LEM: 0.3865, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7147, partial_loss/deprel_loss: 0.4772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6886, loss: 0.5641, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  36%|###6      | 40/111 [00:28<00:52,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9577, LAS: 0.9223, UEM: 0.6054, LEM: 0.3808, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2507, partial_loss/deprel_loss: 0.3784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5167, loss: 0.5653, batch_reg_loss: 0.1639, reg_loss: 0.1640 ||:  39%|###8      | 43/111 [00:30<00:49,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9583, LAS: 0.9233, UEM: 0.6294, LEM: 0.4113, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0886, partial_loss/deprel_loss: 0.1720, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3192, loss: 0.5584, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||:  41%|####1     | 46/111 [00:32<00:47,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9496, UAS: 0.9586, LAS: 0.9236, UEM: 0.6407, LEM: 0.4244, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1205, partial_loss/deprel_loss: 0.1973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3458, loss: 0.5557, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||:  45%|####5     | 50/111 [00:35<00:43,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9588, LAS: 0.9235, UEM: 0.6325, LEM: 0.4154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2406, partial_loss/deprel_loss: 0.3505, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4924, loss: 0.5578, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||:  49%|####8     | 54/111 [00:37<00:38,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9588, LAS: 0.9236, UEM: 0.6321, LEM: 0.4144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1250, partial_loss/deprel_loss: 0.2503, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3891, loss: 0.5572, batch_reg_loss: 0.1639, reg_loss: 0.1639 ||:  51%|#####1    | 57/111 [00:39<00:36,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9582, LAS: 0.9231, UEM: 0.6267, LEM: 0.4089, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2787, partial_loss/deprel_loss: 0.2862, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4485, loss: 0.5608, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  55%|#####4    | 61/111 [00:42<00:33,  1.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9581, LAS: 0.9230, UEM: 0.6202, LEM: 0.4024, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4928, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5998, loss: 0.5626, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  59%|#####8    | 65/111 [00:45<00:30,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9577, LAS: 0.9226, UEM: 0.6181, LEM: 0.3990, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.3742, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5312, loss: 0.5654, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  61%|######1   | 68/111 [00:47<00:29,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9583, LAS: 0.9231, UEM: 0.6201, LEM: 0.3982, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3537, partial_loss/deprel_loss: 0.4052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5587, loss: 0.5631, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  64%|######3   | 71/111 [00:49<00:27,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9581, LAS: 0.9230, UEM: 0.6127, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4975, partial_loss/deprel_loss: 0.4292, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6067, loss: 0.5656, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  67%|######6   | 74/111 [00:51<00:26,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9437, UAS: 0.9583, LAS: 0.9234, UEM: 0.6134, LEM: 0.3913, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2865, partial_loss/deprel_loss: 0.3171, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4748, loss: 0.5631, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  70%|#######   | 78/111 [00:54<00:22,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9589, LAS: 0.9240, UEM: 0.6244, LEM: 0.4020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1680, partial_loss/deprel_loss: 0.2197, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3732, loss: 0.5580, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  73%|#######2  | 81/111 [00:56<00:20,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9588, LAS: 0.9238, UEM: 0.6206, LEM: 0.3978, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2257, partial_loss/deprel_loss: 0.2934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4437, loss: 0.5580, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  77%|#######6  | 85/111 [00:59<00:18,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9595, LAS: 0.9246, UEM: 0.6336, LEM: 0.4103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2709, partial_loss/deprel_loss: 0.3525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4999, loss: 0.5523, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  80%|########  | 89/111 [01:01<00:14,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9602, LAS: 0.9254, UEM: 0.6529, LEM: 0.4353, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1587, partial_loss/deprel_loss: 0.2924, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4294, loss: 0.5475, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  84%|########3 | 93/111 [01:05<00:13,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9599, LAS: 0.9252, UEM: 0.6513, LEM: 0.4335, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1936, partial_loss/deprel_loss: 0.2764, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4236, loss: 0.5494, batch_reg_loss: 0.1638, reg_loss: 0.1639 ||:  86%|########6 | 96/111 [01:07<00:10,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9597, LAS: 0.9249, UEM: 0.6490, LEM: 0.4296, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2162, partial_loss/deprel_loss: 0.3828, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5132, loss: 0.5507, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||:  90%|######### | 100/111 [01:09<00:07,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9405, UAS: 0.9595, LAS: 0.9246, UEM: 0.6438, LEM: 0.4233, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2196, partial_loss/deprel_loss: 0.3284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4704, loss: 0.5532, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||:  95%|#########4| 105/111 [01:11<00:03,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9597, LAS: 0.9248, UEM: 0.6440, LEM: 0.4238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.3587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5283, loss: 0.5515, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||:  99%|#########9| 110/111 [01:13<00:00,  1.81it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9597, LAS: 0.9249, UEM: 0.6435, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2821, partial_loss/deprel_loss: 0.3450, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4962, loss: 0.5510, batch_reg_loss: 0.1637, reg_loss: 0.1639 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
      "2023-04-07 01:24:02,965 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.345  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.282  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.164  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - UEM                      |     0.644  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - LAS                      |     0.925  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - loss                     |     0.551  |       N/A\n",
      "2023-04-07 01:24:02,966 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - LEM                      |     0.423  |       N/A\n",
      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - EM                       |     0.931  |       N/A\n",
      "2023-04-07 01:24:02,967 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:24:02,972 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:24:08,115 - INFO - combo.training.trainer - Epoch duration: 0:01:22.524054\n",
      "2023-04-07 01:24:08,116 - INFO - combo.training.trainer - Estimated training time remaining: 6:32:00\n",
      "2023-04-07 01:24:08,116 - INFO - allennlp.training.trainer - Epoch 113/399\n",
      "2023-04-07 01:24:08,119 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:24:08,120 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:24:08,127 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9435, LAS: 0.9077, UEM: 0.5920, LEM: 0.3600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1878, partial_loss/deprel_loss: 0.2747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4211, loss: 0.6665, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:   3%|2         | 3/111 [00:02<01:18,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9525, LAS: 0.9181, UEM: 0.6117, LEM: 0.3944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3329, partial_loss/deprel_loss: 0.3963, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5473, loss: 0.5999, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:   5%|5         | 6/111 [00:04<01:14,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9566, LAS: 0.9209, UEM: 0.6403, LEM: 0.4142, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1369, partial_loss/deprel_loss: 0.2747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4108, loss: 0.5777, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:   8%|8         | 9/111 [00:06<01:12,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9572, UAS: 0.9597, LAS: 0.9256, UEM: 0.6848, LEM: 0.4760, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0767, partial_loss/deprel_loss: 0.1787, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3220, loss: 0.5496, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:  11%|#         | 12/111 [00:08<01:11,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9600, LAS: 0.9256, UEM: 0.6684, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5117, partial_loss/deprel_loss: 0.4077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5922, loss: 0.5426, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:  14%|#3        | 15/111 [00:10<01:08,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9054, UAS: 0.9572, LAS: 0.9225, UEM: 0.6189, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6246, partial_loss/deprel_loss: 0.5487, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7275, loss: 0.5690, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:  17%|#7        | 19/111 [00:13<01:02,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9574, LAS: 0.9231, UEM: 0.6233, LEM: 0.4158, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1474, partial_loss/deprel_loss: 0.2087, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3601, loss: 0.5615, batch_reg_loss: 0.1637, reg_loss: 0.1637 ||:  21%|##        | 23/111 [00:15<00:57,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8803, UAS: 0.9573, LAS: 0.9233, UEM: 0.6406, LEM: 0.4323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0529, partial_loss/deprel_loss: 0.5422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8079, loss: 0.5586, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  24%|##4       | 27/111 [00:18<00:54,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9564, LAS: 0.9221, UEM: 0.6399, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1533, partial_loss/deprel_loss: 0.2707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4108, loss: 0.5640, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  27%|##7       | 30/111 [00:20<00:54,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9571, LAS: 0.9223, UEM: 0.6434, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1653, partial_loss/deprel_loss: 0.2758, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4173, loss: 0.5608, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  30%|##9       | 33/111 [00:22<00:52,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9044, UAS: 0.9564, LAS: 0.9217, UEM: 0.6241, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6261, partial_loss/deprel_loss: 0.4662, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6618, loss: 0.5668, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  32%|###2      | 36/111 [00:24<00:51,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9566, LAS: 0.9218, UEM: 0.6162, LEM: 0.4052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3270, partial_loss/deprel_loss: 0.3358, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4977, loss: 0.5653, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  35%|###5      | 39/111 [00:26<00:50,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9567, LAS: 0.9220, UEM: 0.6088, LEM: 0.3970, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6791, partial_loss/deprel_loss: 0.4889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6906, loss: 0.5671, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  38%|###7      | 42/111 [00:28<00:49,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9564, LAS: 0.9216, UEM: 0.6039, LEM: 0.3907, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1989, partial_loss/deprel_loss: 0.2975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4414, loss: 0.5713, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  41%|####1     | 46/111 [00:31<00:45,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9572, LAS: 0.9224, UEM: 0.6089, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5235, partial_loss/deprel_loss: 0.4346, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6160, loss: 0.5652, batch_reg_loss: 0.1636, reg_loss: 0.1637 ||:  45%|####5     | 50/111 [00:34<00:42,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9569, LAS: 0.9224, UEM: 0.6093, LEM: 0.3951, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7306, partial_loss/deprel_loss: 0.5466, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7470, loss: 0.5666, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||:  49%|####8     | 54/111 [00:36<00:38,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9574, LAS: 0.9229, UEM: 0.6208, LEM: 0.4067, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6226, partial_loss/deprel_loss: 0.4704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6644, loss: 0.5625, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9579, LAS: 0.9234, UEM: 0.6257, LEM: 0.4112, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3557, partial_loss/deprel_loss: 0.4244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5743, loss: 0.5590, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||:  54%|#####4    | 60/111 [00:41<00:35,  1.43it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9586, LAS: 0.9242, UEM: 0.6372, LEM: 0.4214, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3923, loss: 0.5533, batch_reg_loss: 0.1636, reg_loss: 0.1636 ||:  57%|#####6    | 63/111 [00:43<00:36,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9245, UAS: 0.9583, LAS: 0.9240, UEM: 0.6283, LEM: 0.4121, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3313, partial_loss/deprel_loss: 0.3747, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5295, loss: 0.5554, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  60%|######    | 67/111 [00:46<00:31,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9525, UAS: 0.9595, LAS: 0.9252, UEM: 0.6533, LEM: 0.4396, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1309, partial_loss/deprel_loss: 0.2326, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3758, loss: 0.5470, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  63%|######3   | 70/111 [00:48<00:28,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9599, LAS: 0.9257, UEM: 0.6554, LEM: 0.4405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1910, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4856, loss: 0.5443, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  66%|######5   | 73/111 [00:50<00:28,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9596, LAS: 0.9254, UEM: 0.6500, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3578, partial_loss/deprel_loss: 0.3686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5300, loss: 0.5468, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  69%|######9   | 77/111 [00:53<00:24,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9601, LAS: 0.9257, UEM: 0.6518, LEM: 0.4329, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1751, partial_loss/deprel_loss: 0.2854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.5443, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  73%|#######2  | 81/111 [00:55<00:19,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8800, UAS: 0.9595, LAS: 0.9250, UEM: 0.6442, LEM: 0.4260, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8791, partial_loss/deprel_loss: 0.5936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8142, loss: 0.5483, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  77%|#######7  | 86/111 [00:57<00:14,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9598, LAS: 0.9254, UEM: 0.6547, LEM: 0.4429, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5151, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6146, loss: 0.5463, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  81%|########1 | 90/111 [01:00<00:13,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9604, LAS: 0.9259, UEM: 0.6577, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2140, partial_loss/deprel_loss: 0.3738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5053, loss: 0.5433, batch_reg_loss: 0.1635, reg_loss: 0.1636 ||:  85%|########4 | 94/111 [01:02<00:10,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9602, LAS: 0.9256, UEM: 0.6506, LEM: 0.4359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4410, partial_loss/deprel_loss: 0.4332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5982, loss: 0.5457, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||:  88%|########8 | 98/111 [01:05<00:07,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9604, LAS: 0.9258, UEM: 0.6540, LEM: 0.4368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3462, partial_loss/deprel_loss: 0.3633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5233, loss: 0.5434, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||:  92%|#########1| 102/111 [01:07<00:05,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9605, LAS: 0.9260, UEM: 0.6514, LEM: 0.4324, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3090, partial_loss/deprel_loss: 0.3175, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4792, loss: 0.5419, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||:  96%|#########6| 107/111 [01:10<00:02,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9601, LAS: 0.9256, UEM: 0.6451, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4750, partial_loss/deprel_loss: 0.4599, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6263, loss: 0.5441, batch_reg_loss: 0.1634, reg_loss: 0.1636 ||: 100%|##########| 111/111 [01:12<00:00,  1.54it/s]\n",
      "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:25:23,464 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.460  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.475  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.164  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - UEM                      |     0.645  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - LAS                      |     0.926  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - loss                     |     0.544  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - LEM                      |     0.427  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - UAS                      |     0.960  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - EM                       |     0.915  |       N/A\n",
      "2023-04-07 01:25:23,465 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:25:23,472 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:25:28,456 - INFO - combo.training.trainer - Epoch duration: 0:01:20.340225\n",
      "2023-04-07 01:25:28,456 - INFO - combo.training.trainer - Estimated training time remaining: 6:30:34\n",
      "2023-04-07 01:25:28,457 - INFO - allennlp.training.trainer - Epoch 114/399\n",
      "2023-04-07 01:25:28,457 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:25:28,457 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:25:28,466 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9547, LAS: 0.9186, UEM: 0.4273, LEM: 0.1939, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6578, partial_loss/deprel_loss: 0.4807, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6796, loss: 0.6056, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||:   3%|2         | 3/111 [00:02<01:21,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9297, UAS: 0.9578, LAS: 0.9234, UEM: 0.4774, LEM: 0.2359, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.3978, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.5772, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||:   5%|5         | 6/111 [00:04<01:18,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9633, LAS: 0.9302, UEM: 0.5858, LEM: 0.3515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2834, partial_loss/deprel_loss: 0.3211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.5286, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||:   9%|9         | 10/111 [00:06<01:11,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9626, LAS: 0.9286, UEM: 0.6194, LEM: 0.3824, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5775, partial_loss/deprel_loss: 0.5050, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6829, loss: 0.5309, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||:  13%|#2        | 14/111 [00:09<01:05,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9637, LAS: 0.9305, UEM: 0.6935, LEM: 0.4949, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2059, partial_loss/deprel_loss: 0.3146, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4562, loss: 0.5180, batch_reg_loss: 0.1634, reg_loss: 0.1634 ||:  15%|#5        | 17/111 [00:11<01:08,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9251, UAS: 0.9644, LAS: 0.9308, UEM: 0.6832, LEM: 0.4742, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3690, partial_loss/deprel_loss: 0.4402, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5893, loss: 0.5159, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  19%|#8        | 21/111 [00:14<01:02,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9633, LAS: 0.9294, UEM: 0.6628, LEM: 0.4527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6813, partial_loss/deprel_loss: 0.5702, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7558, loss: 0.5264, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  22%|##1       | 24/111 [00:16<01:00,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9644, LAS: 0.9303, UEM: 0.6832, LEM: 0.4702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0925, partial_loss/deprel_loss: 0.2237, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3608, loss: 0.5173, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  24%|##4       | 27/111 [00:18<00:58,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9140, UAS: 0.9624, LAS: 0.9282, UEM: 0.6623, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4599, partial_loss/deprel_loss: 0.4563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6204, loss: 0.5314, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  27%|##7       | 30/111 [00:20<00:56,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9620, LAS: 0.9284, UEM: 0.6473, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6177, partial_loss/deprel_loss: 0.4161, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6197, loss: 0.5333, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  31%|###       | 34/111 [00:23<00:51,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9632, LAS: 0.9297, UEM: 0.6585, LEM: 0.4422, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3120, partial_loss/deprel_loss: 0.3296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4894, loss: 0.5242, batch_reg_loss: 0.1633, reg_loss: 0.1634 ||:  34%|###4      | 38/111 [00:25<00:48,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9624, LAS: 0.9289, UEM: 0.6467, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2178, partial_loss/deprel_loss: 0.2864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4360, loss: 0.5306, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||:  38%|###7      | 42/111 [00:28<00:46,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9616, LAS: 0.9279, UEM: 0.6359, LEM: 0.4228, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7707, partial_loss/deprel_loss: 0.5840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7846, loss: 0.5386, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||:  41%|####      | 45/111 [00:30<00:47,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9620, LAS: 0.9282, UEM: 0.6325, LEM: 0.4168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2114, partial_loss/deprel_loss: 0.2645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4172, loss: 0.5358, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||:  43%|####3     | 48/111 [00:33<00:45,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9617, LAS: 0.9280, UEM: 0.6243, LEM: 0.4086, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3437, partial_loss/deprel_loss: 0.3858, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5407, loss: 0.5381, batch_reg_loss: 0.1633, reg_loss: 0.1633 ||:  46%|####5     | 51/111 [00:35<00:44,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9617, LAS: 0.9280, UEM: 0.6325, LEM: 0.4184, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3666, partial_loss/deprel_loss: 0.3718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5340, loss: 0.5358, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  49%|####8     | 54/111 [00:37<00:41,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8896, UAS: 0.9615, LAS: 0.9277, UEM: 0.6346, LEM: 0.4193, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9003, partial_loss/deprel_loss: 0.5767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8046, loss: 0.5368, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  51%|#####1    | 57/111 [00:39<00:39,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8737, UAS: 0.9606, LAS: 0.9267, UEM: 0.6277, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0115, partial_loss/deprel_loss: 0.6611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8944, loss: 0.5447, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  54%|#####4    | 60/111 [00:42<00:37,  1.35it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9222, UAS: 0.9609, LAS: 0.9269, UEM: 0.6307, LEM: 0.4115, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4027, partial_loss/deprel_loss: 0.4277, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5859, loss: 0.5431, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  57%|#####6    | 63/111 [00:44<00:36,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9607, LAS: 0.9267, UEM: 0.6229, LEM: 0.4040, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2619, partial_loss/deprel_loss: 0.3418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4891, loss: 0.5432, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  60%|######    | 67/111 [00:46<00:31,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9613, LAS: 0.9271, UEM: 0.6294, LEM: 0.4077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1762, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4539, loss: 0.5403, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  63%|######3   | 70/111 [00:49<00:29,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9609, LAS: 0.9267, UEM: 0.6307, LEM: 0.4092, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3327, partial_loss/deprel_loss: 0.3712, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.5436, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  66%|######5   | 73/111 [00:51<00:26,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9613, LAS: 0.9272, UEM: 0.6381, LEM: 0.4157, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2478, partial_loss/deprel_loss: 0.3511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4936, loss: 0.5398, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  68%|######8   | 76/111 [00:53<00:24,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9614, LAS: 0.9272, UEM: 0.6402, LEM: 0.4171, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4677, partial_loss/deprel_loss: 0.4691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6320, loss: 0.5406, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  72%|#######2  | 80/111 [00:55<00:20,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9616, LAS: 0.9273, UEM: 0.6387, LEM: 0.4146, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1989, partial_loss/deprel_loss: 0.3139, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4541, loss: 0.5391, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  76%|#######5  | 84/111 [00:57<00:17,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9616, LAS: 0.9271, UEM: 0.6359, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6056, partial_loss/deprel_loss: 0.4984, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6830, loss: 0.5388, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  80%|########  | 89/111 [01:00<00:13,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9613, LAS: 0.9268, UEM: 0.6340, LEM: 0.4079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1500, partial_loss/deprel_loss: 0.2520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3948, loss: 0.5409, batch_reg_loss: 0.1632, reg_loss: 0.1633 ||:  85%|########4 | 94/111 [01:02<00:09,  1.76it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9607, LAS: 0.9261, UEM: 0.6273, LEM: 0.4017, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4857, partial_loss/deprel_loss: 0.3974, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5782, loss: 0.5446, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||:  89%|########9 | 99/111 [01:05<00:06,  1.87it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9608, LAS: 0.9263, UEM: 0.6391, LEM: 0.4190, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5761, partial_loss/deprel_loss: 0.4574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6442, loss: 0.5438, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||:  93%|#########2| 103/111 [01:07<00:04,  1.69it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9232, UAS: 0.9606, LAS: 0.9262, UEM: 0.6421, LEM: 0.4215, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3545, partial_loss/deprel_loss: 0.4660, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6068, loss: 0.5446, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||:  96%|#########6| 107/111 [01:10<00:02,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9610, LAS: 0.9266, UEM: 0.6457, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2279, partial_loss/deprel_loss: 0.2647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4205, loss: 0.5415, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||: 100%|##########| 111/111 [01:13<00:00,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9610, LAS: 0.9266, UEM: 0.6457, LEM: 0.4231, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2279, partial_loss/deprel_loss: 0.2647, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4205, loss: 0.5415, batch_reg_loss: 0.1631, reg_loss: 0.1633 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.265  |       N/A\n",
      "2023-04-07 01:26:44,758 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.228  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.163  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - UEM                      |     0.646  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - loss                     |     0.542  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - LEM                      |     0.423  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - EM                       |     0.937  |       N/A\n",
      "2023-04-07 01:26:44,759 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:26:44,764 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:26:49,799 - INFO - combo.training.trainer - Epoch duration: 0:01:21.342111\n",
      "2023-04-07 01:26:49,799 - INFO - combo.training.trainer - Estimated training time remaining: 6:29:11\n",
      "2023-04-07 01:26:49,799 - INFO - allennlp.training.trainer - Epoch 115/399\n",
      "2023-04-07 01:26:49,799 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:26:49,800 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:26:49,811 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9547, LAS: 0.9173, UEM: 0.3925, LEM: 0.1752, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3871, partial_loss/deprel_loss: 0.3791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5438, loss: 0.5949, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:   4%|3         | 4/111 [00:02<01:03,  1.68it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9481, UAS: 0.9608, LAS: 0.9239, UEM: 0.6031, LEM: 0.3739, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0845, partial_loss/deprel_loss: 0.2596, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3876, loss: 0.5477, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:   6%|6         | 7/111 [00:04<01:06,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9610, LAS: 0.9251, UEM: 0.6085, LEM: 0.3740, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2537, partial_loss/deprel_loss: 0.3027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4560, loss: 0.5365, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:   9%|9         | 10/111 [00:06<01:05,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9606, LAS: 0.9248, UEM: 0.5913, LEM: 0.3514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3193, partial_loss/deprel_loss: 0.3527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5091, loss: 0.5387, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:  13%|#2        | 14/111 [00:09<01:02,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8811, UAS: 0.9561, LAS: 0.9205, UEM: 0.5787, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9752, partial_loss/deprel_loss: 0.5953, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8343, loss: 0.5763, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:  16%|#6        | 18/111 [00:11<01:00,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9571, LAS: 0.9214, UEM: 0.5802, LEM: 0.3486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4454, partial_loss/deprel_loss: 0.4338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5991, loss: 0.5686, batch_reg_loss: 0.1631, reg_loss: 0.1631 ||:  19%|#8        | 21/111 [00:13<00:59,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8998, UAS: 0.9558, LAS: 0.9203, UEM: 0.5699, LEM: 0.3397, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7849, partial_loss/deprel_loss: 0.5225, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7381, loss: 0.5809, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  23%|##2       | 25/111 [00:16<00:54,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9003, UAS: 0.9560, LAS: 0.9204, UEM: 0.5712, LEM: 0.3433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7318, partial_loss/deprel_loss: 0.5219, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7270, loss: 0.5789, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  26%|##6       | 29/111 [00:18<00:52,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9562, LAS: 0.9205, UEM: 0.5662, LEM: 0.3370, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4325, partial_loss/deprel_loss: 0.3829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5558, loss: 0.5776, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  29%|##8       | 32/111 [00:20<00:51,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9074, UAS: 0.9567, LAS: 0.9210, UEM: 0.5642, LEM: 0.3343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5532, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6488, loss: 0.5761, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  32%|###2      | 36/111 [00:23<00:48,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9577, LAS: 0.9227, UEM: 0.5645, LEM: 0.3351, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2900, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4949, loss: 0.5676, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  36%|###6      | 40/111 [00:25<00:44,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9432, UAS: 0.9593, LAS: 0.9242, UEM: 0.6023, LEM: 0.3702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1667, partial_loss/deprel_loss: 0.2403, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3885, loss: 0.5565, batch_reg_loss: 0.1630, reg_loss: 0.1631 ||:  40%|###9      | 44/111 [00:28<00:42,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9598, LAS: 0.9247, UEM: 0.6098, LEM: 0.3747, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1807, partial_loss/deprel_loss: 0.3618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4886, loss: 0.5529, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||:  43%|####3     | 48/111 [00:30<00:39,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8900, UAS: 0.9600, LAS: 0.9249, UEM: 0.6152, LEM: 0.3815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8968, partial_loss/deprel_loss: 0.6086, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8292, loss: 0.5531, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||:  47%|####6     | 52/111 [00:33<00:38,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9760, UAS: 0.9603, LAS: 0.9255, UEM: 0.6436, LEM: 0.4230, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0247, partial_loss/deprel_loss: 0.0855, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2363, loss: 0.5484, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||:  50%|#####     | 56/111 [00:37<00:40,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9620, UAS: 0.9613, LAS: 0.9268, UEM: 0.6714, LEM: 0.4588, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0662, partial_loss/deprel_loss: 0.1438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2913, loss: 0.5381, batch_reg_loss: 0.1630, reg_loss: 0.1630 ||:  53%|#####3    | 59/111 [00:39<00:40,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9611, LAS: 0.9266, UEM: 0.6727, LEM: 0.4602, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1327, partial_loss/deprel_loss: 0.2068, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3549, loss: 0.5380, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  57%|#####6    | 63/111 [00:42<00:37,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9608, LAS: 0.9264, UEM: 0.6661, LEM: 0.4527, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3382, partial_loss/deprel_loss: 0.3869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5401, loss: 0.5396, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  59%|#####9    | 66/111 [00:45<00:33,  1.33it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9610, LAS: 0.9265, UEM: 0.6630, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1927, partial_loss/deprel_loss: 0.3164, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4546, loss: 0.5398, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  64%|######3   | 71/111 [00:47<00:26,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9604, LAS: 0.9259, UEM: 0.6528, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7439, partial_loss/deprel_loss: 0.5034, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7144, loss: 0.5445, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  68%|######8   | 76/111 [00:49<00:21,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9079, UAS: 0.9600, LAS: 0.9254, UEM: 0.6427, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6552, partial_loss/deprel_loss: 0.4768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6753, loss: 0.5482, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  73%|#######2  | 81/111 [00:52<00:17,  1.76it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9605, LAS: 0.9259, UEM: 0.6488, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1739, partial_loss/deprel_loss: 0.2751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4177, loss: 0.5444, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  77%|#######6  | 85/111 [00:54<00:14,  1.76it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9603, LAS: 0.9255, UEM: 0.6422, LEM: 0.4275, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1929, partial_loss/deprel_loss: 0.3498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4813, loss: 0.5465, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  80%|########  | 89/111 [00:57<00:13,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9104, UAS: 0.9602, LAS: 0.9253, UEM: 0.6407, LEM: 0.4251, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5308, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6338, loss: 0.5477, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  84%|########3 | 93/111 [01:00<00:12,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9604, LAS: 0.9255, UEM: 0.6448, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1062, partial_loss/deprel_loss: 0.2317, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3694, loss: 0.5461, batch_reg_loss: 0.1629, reg_loss: 0.1630 ||:  87%|########7 | 97/111 [01:03<00:09,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9604, LAS: 0.9255, UEM: 0.6440, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7574, partial_loss/deprel_loss: 0.5058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7189, loss: 0.5467, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||:  91%|######### | 101/111 [01:06<00:06,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9607, LAS: 0.9259, UEM: 0.6425, LEM: 0.4246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3432, partial_loss/deprel_loss: 0.3784, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5342, loss: 0.5447, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||:  95%|#########4| 105/111 [01:09<00:04,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9607, LAS: 0.9259, UEM: 0.6409, LEM: 0.4238, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4736, partial_loss/deprel_loss: 0.4850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6455, loss: 0.5447, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||:  98%|#########8| 109/111 [01:11<00:01,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9488, UAS: 0.9610, LAS: 0.9262, UEM: 0.6476, LEM: 0.4308, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0943, partial_loss/deprel_loss: 0.2058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3463, loss: 0.5421, batch_reg_loss: 0.1628, reg_loss: 0.1630 ||: 100%|##########| 111/111 [01:13<00:00,  1.52it/s]\n",
      "2023-04-07 01:28:05,803 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8771, UAS: 0.9357, LAS: 0.8788, UEM: 0.3387, LEM: 0.0753, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9730, partial_loss/deprel_loss: 35.4884, partial_loss/cycle_loss: 0.0000, batch_loss: 28.5853, loss: 31.0780, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:12,  1.09s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9552, LAS: 0.9039, UEM: 0.6997, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1418, partial_loss/deprel_loss: 22.8051, partial_loss/cycle_loss: 0.0000, batch_loss: 18.2725, loss: 25.2398, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  31%|###       | 4/13 [00:04<00:09,  1.09s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8876, UAS: 0.9505, LAS: 0.9004, UEM: 0.6364, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7520, partial_loss/deprel_loss: 28.9441, partial_loss/cycle_loss: 0.0000, batch_loss: 23.3056, loss: 25.0064, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  54%|#####3    | 7/13 [00:07<00:06,  1.04s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9062, UAS: 0.9546, LAS: 0.9063, UEM: 0.7099, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5701, partial_loss/deprel_loss: 23.5040, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9172, loss: 23.1846, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:09<00:04,  1.06s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8905, UAS: 0.9528, LAS: 0.9035, UEM: 0.6763, LEM: 0.4070, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7413, partial_loss/deprel_loss: 33.2838, partial_loss/cycle_loss: 0.0000, batch_loss: 26.7753, loss: 23.2175, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  92%|#########2| 12/13 [00:11<00:00,  1.02it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8407, UAS: 0.9483, LAS: 0.8987, UEM: 0.6599, LEM: 0.3961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6642, partial_loss/deprel_loss: 54.1649, partial_loss/cycle_loss: 0.0000, batch_loss: 43.6647, loss: 24.7903, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.00it/s]\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - patience                 |     5.000  |       N/A\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.206  |    54.165\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.094  |     1.664\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.163  |     0.000\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - UEM                      |     0.648  |     0.660\n",
      "2023-04-07 01:28:18,777 - INFO - combo.training.tensorboard_writer - LAS                      |     0.926  |     0.899\n",
      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - loss                     |     0.542  |    24.790\n",
      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - LEM                      |     0.431  |     0.396\n",
      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |     0.948\n",
      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - EM                       |     0.949  |     0.841\n",
      "2023-04-07 01:28:18,778 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:28:18,783 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:28:23,018 - INFO - combo.training.trainer - Epoch duration: 0:01:33.219014\n",
      "2023-04-07 01:28:23,019 - INFO - combo.training.trainer - Estimated training time remaining: 6:28:17\n",
      "2023-04-07 01:28:23,019 - INFO - allennlp.training.trainer - Epoch 116/399\n",
      "2023-04-07 01:28:23,019 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:28:23,020 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:28:23,029 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9574, LAS: 0.9219, UEM: 0.5537, LEM: 0.3239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2990, partial_loss/deprel_loss: 0.3329, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4890, loss: 0.5787, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:   4%|3         | 4/111 [00:02<01:11,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9581, LAS: 0.9241, UEM: 0.5307, LEM: 0.3093, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6387, partial_loss/deprel_loss: 0.4368, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6399, loss: 0.5651, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:   7%|7         | 8/111 [00:05<01:07,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9591, LAS: 0.9241, UEM: 0.5168, LEM: 0.2895, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4099, partial_loss/deprel_loss: 0.4618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6142, loss: 0.5604, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:  10%|9         | 11/111 [00:07<01:07,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9129, UAS: 0.9567, LAS: 0.9219, UEM: 0.5284, LEM: 0.3066, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4870, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6121, loss: 0.5698, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:  13%|#2        | 14/111 [00:09<01:08,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9312, UAS: 0.9564, LAS: 0.9219, UEM: 0.5200, LEM: 0.2981, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3841, partial_loss/deprel_loss: 0.3641, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5309, loss: 0.5723, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:  15%|#5        | 17/111 [00:11<01:07,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9589, LAS: 0.9248, UEM: 0.6190, LEM: 0.4255, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.3886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5315, loss: 0.5545, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:  18%|#8        | 20/111 [00:14<01:06,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9577, LAS: 0.9236, UEM: 0.6216, LEM: 0.4336, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5082, partial_loss/deprel_loss: 0.4548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6282, loss: 0.5616, batch_reg_loss: 0.1628, reg_loss: 0.1628 ||:  21%|##        | 23/111 [00:16<01:07,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9595, LAS: 0.9256, UEM: 0.6471, LEM: 0.4526, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1424, partial_loss/deprel_loss: 0.2302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3754, loss: 0.5457, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||:  23%|##3       | 26/111 [00:19<01:07,  1.26it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9190, UAS: 0.9588, LAS: 0.9249, UEM: 0.6298, LEM: 0.4361, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3933, partial_loss/deprel_loss: 0.4228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5796, loss: 0.5488, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||:  26%|##6       | 29/111 [00:21<01:02,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9606, LAS: 0.9268, UEM: 0.6540, LEM: 0.4570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3722, partial_loss/deprel_loss: 0.3230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4956, loss: 0.5388, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||:  30%|##9       | 33/111 [00:23<00:54,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9612, LAS: 0.9271, UEM: 0.6495, LEM: 0.4434, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1959, partial_loss/deprel_loss: 0.3470, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4795, loss: 0.5359, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||:  34%|###4      | 38/111 [00:26<00:47,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9500, UAS: 0.9614, LAS: 0.9273, UEM: 0.6543, LEM: 0.4509, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1142, partial_loss/deprel_loss: 0.1998, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3453, loss: 0.5354, batch_reg_loss: 0.1627, reg_loss: 0.1628 ||:  39%|###8      | 43/111 [00:28<00:40,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9616, LAS: 0.9277, UEM: 0.6489, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2601, partial_loss/deprel_loss: 0.3257, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4753, loss: 0.5345, batch_reg_loss: 0.1627, reg_loss: 0.1627 ||:  43%|####3     | 48/111 [00:31<00:35,  1.75it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9621, LAS: 0.9282, UEM: 0.6544, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1851, partial_loss/deprel_loss: 0.2794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4232, loss: 0.5299, batch_reg_loss: 0.1627, reg_loss: 0.1627 ||:  47%|####6     | 52/111 [00:33<00:35,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9624, LAS: 0.9282, UEM: 0.6494, LEM: 0.4354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3444, partial_loss/deprel_loss: 0.4008, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5522, loss: 0.5285, batch_reg_loss: 0.1627, reg_loss: 0.1627 ||:  50%|#####     | 56/111 [00:36<00:35,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9626, LAS: 0.9284, UEM: 0.6518, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2388, partial_loss/deprel_loss: 0.3454, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4868, loss: 0.5269, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  54%|#####4    | 60/111 [00:40<00:36,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9604, UAS: 0.9629, LAS: 0.9288, UEM: 0.6697, LEM: 0.4579, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0658, partial_loss/deprel_loss: 0.1754, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3161, loss: 0.5245, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  58%|#####7    | 64/111 [00:43<00:33,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9629, LAS: 0.9286, UEM: 0.6671, LEM: 0.4545, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1502, partial_loss/deprel_loss: 0.2937, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4276, loss: 0.5241, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  61%|######1   | 68/111 [00:45<00:29,  1.44it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9630, LAS: 0.9289, UEM: 0.6664, LEM: 0.4523, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2564, partial_loss/deprel_loss: 0.3409, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4866, loss: 0.5225, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  65%|######4   | 72/111 [00:48<00:25,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9107, UAS: 0.9620, LAS: 0.9276, UEM: 0.6565, LEM: 0.4431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5197, partial_loss/deprel_loss: 0.4834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6533, loss: 0.5320, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  68%|######8   | 76/111 [00:50<00:23,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8912, UAS: 0.9617, LAS: 0.9273, UEM: 0.6535, LEM: 0.4384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8500, partial_loss/deprel_loss: 0.5179, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7469, loss: 0.5336, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  72%|#######2  | 80/111 [00:53<00:20,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9613, LAS: 0.9271, UEM: 0.6508, LEM: 0.4368, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5955, partial_loss/deprel_loss: 0.4227, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.5355, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  76%|#######5  | 84/111 [00:56<00:18,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9300, UAS: 0.9606, LAS: 0.9264, UEM: 0.6449, LEM: 0.4306, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3222, partial_loss/deprel_loss: 0.3930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5414, loss: 0.5413, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  79%|#######9  | 88/111 [00:58<00:15,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9608, LAS: 0.9267, UEM: 0.6465, LEM: 0.4318, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2406, partial_loss/deprel_loss: 0.3309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4754, loss: 0.5395, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  83%|########2 | 92/111 [01:01<00:12,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9001, UAS: 0.9609, LAS: 0.9267, UEM: 0.6496, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7109, partial_loss/deprel_loss: 0.4976, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7028, loss: 0.5385, batch_reg_loss: 0.1626, reg_loss: 0.1627 ||:  86%|########6 | 96/111 [01:04<00:10,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9066, UAS: 0.9610, LAS: 0.9268, UEM: 0.6488, LEM: 0.4326, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6543, partial_loss/deprel_loss: 0.4789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6765, loss: 0.5377, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||:  90%|######### | 100/111 [01:06<00:07,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9289, UAS: 0.9608, LAS: 0.9266, UEM: 0.6439, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2691, partial_loss/deprel_loss: 0.3528, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4986, loss: 0.5396, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||:  93%|#########2| 103/111 [01:08<00:05,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9610, LAS: 0.9268, UEM: 0.6465, LEM: 0.4289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1619, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4258, loss: 0.5377, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||:  96%|#########6| 107/111 [01:11<00:02,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9608, LAS: 0.9265, UEM: 0.6469, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1204, partial_loss/deprel_loss: 0.2431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3811, loss: 0.5391, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||:  99%|#########9| 110/111 [01:13<00:00,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9609, LAS: 0.9266, UEM: 0.6485, LEM: 0.4310, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2016, partial_loss/deprel_loss: 0.2930, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4372, loss: 0.5382, batch_reg_loss: 0.1625, reg_loss: 0.1627 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
      "2023-04-07 01:29:40,436 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:29:40,436 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:29:40,436 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.293  |       N/A\n",
      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.202  |       N/A\n",
      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.163  |       N/A\n",
      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - UEM                      |     0.649  |       N/A\n",
      "2023-04-07 01:29:40,437 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |       N/A\n",
      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - loss                     |     0.538  |       N/A\n",
      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - LEM                      |     0.431  |       N/A\n",
      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:29:40,438 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
      "2023-04-07 01:29:40,439 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:29:40,439 - INFO - combo.training.tensorboard_writer - EM                       |     0.938  |       N/A\n",
      "2023-04-07 01:29:40,439 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:29:40,447 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:29:45,284 - INFO - combo.training.trainer - Epoch duration: 0:01:22.264978\n",
      "2023-04-07 01:29:45,284 - INFO - combo.training.trainer - Estimated training time remaining: 6:26:55\n",
      "2023-04-07 01:29:45,285 - INFO - allennlp.training.trainer - Epoch 117/399\n",
      "2023-04-07 01:29:45,285 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:29:45,286 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:29:45,297 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8930, UAS: 0.9410, LAS: 0.9072, UEM: 0.2115, LEM: 0.0673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0066, partial_loss/deprel_loss: 0.4922, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7576, loss: 0.6695, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:   3%|2         | 3/111 [00:02<01:16,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9573, LAS: 0.9234, UEM: 0.6225, LEM: 0.4012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1534, partial_loss/deprel_loss: 0.2371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3829, loss: 0.5587, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:   5%|5         | 6/111 [00:04<01:13,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9597, LAS: 0.9265, UEM: 0.6303, LEM: 0.4005, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2763, partial_loss/deprel_loss: 0.2943, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4532, loss: 0.5306, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9618, LAS: 0.9290, UEM: 0.6422, LEM: 0.4102, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3256, partial_loss/deprel_loss: 0.3279, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4899, loss: 0.5178, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:  13%|#2        | 14/111 [00:09<01:04,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9631, LAS: 0.9301, UEM: 0.6359, LEM: 0.3976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2475, partial_loss/deprel_loss: 0.3239, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4711, loss: 0.5122, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:  16%|#6        | 18/111 [00:11<00:57,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9630, LAS: 0.9298, UEM: 0.6229, LEM: 0.3805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3032, partial_loss/deprel_loss: 0.3606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5115, loss: 0.5102, batch_reg_loss: 0.1625, reg_loss: 0.1625 ||:  21%|##        | 23/111 [00:13<00:50,  1.74it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9634, LAS: 0.9309, UEM: 0.6398, LEM: 0.4021, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1709, partial_loss/deprel_loss: 0.2609, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4053, loss: 0.5038, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||:  25%|##5       | 28/111 [00:15<00:43,  1.90it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9280, UAS: 0.9632, LAS: 0.9309, UEM: 0.6331, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3200, partial_loss/deprel_loss: 0.4090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5536, loss: 0.5060, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||:  29%|##8       | 32/111 [00:17<00:41,  1.91it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9744, UAS: 0.9632, LAS: 0.9312, UEM: 0.6660, LEM: 0.4534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0344, partial_loss/deprel_loss: 0.0977, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2474, loss: 0.5044, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||:  32%|###2      | 36/111 [00:21<00:46,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9634, LAS: 0.9313, UEM: 0.6693, LEM: 0.4571, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4329, partial_loss/deprel_loss: 0.4586, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6159, loss: 0.5044, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||:  36%|###6      | 40/111 [00:23<00:45,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9075, UAS: 0.9626, LAS: 0.9303, UEM: 0.6647, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6757, partial_loss/deprel_loss: 0.4823, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6834, loss: 0.5078, batch_reg_loss: 0.1624, reg_loss: 0.1625 ||:  40%|###9      | 44/111 [00:26<00:45,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9623, LAS: 0.9300, UEM: 0.6570, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5023, partial_loss/deprel_loss: 0.4532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6254, loss: 0.5114, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||:  43%|####3     | 48/111 [00:29<00:42,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9164, UAS: 0.9624, LAS: 0.9300, UEM: 0.6613, LEM: 0.4473, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5246, partial_loss/deprel_loss: 0.4793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6507, loss: 0.5130, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||:  47%|####6     | 52/111 [00:32<00:39,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9625, LAS: 0.9299, UEM: 0.6535, LEM: 0.4376, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3355, partial_loss/deprel_loss: 0.3536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5124, loss: 0.5163, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||:  50%|#####     | 56/111 [00:34<00:34,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9621, LAS: 0.9293, UEM: 0.6491, LEM: 0.4327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1408, partial_loss/deprel_loss: 0.2545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3941, loss: 0.5204, batch_reg_loss: 0.1624, reg_loss: 0.1624 ||:  54%|#####4    | 60/111 [00:37<00:32,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9619, LAS: 0.9290, UEM: 0.6429, LEM: 0.4245, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4015, partial_loss/deprel_loss: 0.3097, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4904, loss: 0.5217, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  58%|#####7    | 64/111 [00:39<00:31,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8819, UAS: 0.9610, LAS: 0.9281, UEM: 0.6440, LEM: 0.4281, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0708, partial_loss/deprel_loss: 0.6247, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8763, loss: 0.5269, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  61%|######1   | 68/111 [00:42<00:29,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9601, LAS: 0.9271, UEM: 0.6366, LEM: 0.4217, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3447, partial_loss/deprel_loss: 0.3889, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5424, loss: 0.5337, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  64%|######3   | 71/111 [00:44<00:27,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9602, LAS: 0.9270, UEM: 0.6335, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1685, partial_loss/deprel_loss: 0.3030, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4385, loss: 0.5353, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  67%|######6   | 74/111 [00:47<00:26,  1.41it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9603, LAS: 0.9271, UEM: 0.6388, LEM: 0.4246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5088, partial_loss/deprel_loss: 0.4509, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6248, loss: 0.5350, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  69%|######9   | 77/111 [00:49<00:24,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9032, UAS: 0.9606, LAS: 0.9274, UEM: 0.6483, LEM: 0.4373, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6415, partial_loss/deprel_loss: 0.5587, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7376, loss: 0.5339, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  72%|#######2  | 80/111 [00:51<00:22,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9608, LAS: 0.9275, UEM: 0.6506, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4282, partial_loss/deprel_loss: 0.4634, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6186, loss: 0.5326, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  75%|#######4  | 83/111 [00:53<00:20,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9612, LAS: 0.9277, UEM: 0.6555, LEM: 0.4408, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2927, partial_loss/deprel_loss: 0.3332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4874, loss: 0.5298, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  78%|#######8  | 87/111 [00:56<00:17,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9149, UAS: 0.9611, LAS: 0.9276, UEM: 0.6540, LEM: 0.4393, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6455, partial_loss/deprel_loss: 0.5085, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6982, loss: 0.5311, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  81%|########1 | 90/111 [00:58<00:15,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9606, LAS: 0.9271, UEM: 0.6474, LEM: 0.4331, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6479, partial_loss/deprel_loss: 0.4413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6449, loss: 0.5349, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  85%|########4 | 94/111 [01:01<00:11,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9608, LAS: 0.9273, UEM: 0.6451, LEM: 0.4300, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3137, partial_loss/deprel_loss: 0.3642, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5164, loss: 0.5347, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  87%|########7 | 97/111 [01:03<00:09,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9607, LAS: 0.9271, UEM: 0.6447, LEM: 0.4293, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3215, partial_loss/deprel_loss: 0.4272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5683, loss: 0.5362, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  90%|######### | 100/111 [01:05<00:07,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9605, LAS: 0.9269, UEM: 0.6461, LEM: 0.4320, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1824, partial_loss/deprel_loss: 0.2260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3796, loss: 0.5365, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  93%|#########2| 103/111 [01:07<00:05,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9402, UAS: 0.9608, LAS: 0.9272, UEM: 0.6491, LEM: 0.4333, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1632, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4306, loss: 0.5345, batch_reg_loss: 0.1623, reg_loss: 0.1624 ||:  95%|#########5| 106/111 [01:10<00:03,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9608, LAS: 0.9271, UEM: 0.6473, LEM: 0.4307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2056, partial_loss/deprel_loss: 0.3438, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4784, loss: 0.5352, batch_reg_loss: 0.1622, reg_loss: 0.1624 ||:  99%|#########9| 110/111 [01:12<00:00,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9331, UAS: 0.9608, LAS: 0.9271, UEM: 0.6470, LEM: 0.4302, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3199, partial_loss/deprel_loss: 0.3751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5263, loss: 0.5351, batch_reg_loss: 0.1622, reg_loss: 0.1624 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:31:01,940 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.375  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.320  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.162  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - UEM                      |     0.647  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - loss                     |     0.535  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - LEM                      |     0.430  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:31:01,941 - INFO - combo.training.tensorboard_writer - EM                       |     0.933  |       N/A\n",
      "2023-04-07 01:31:01,942 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:31:01,947 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:31:06,980 - INFO - combo.training.trainer - Epoch duration: 0:01:21.695775\n",
      "2023-04-07 01:31:06,981 - INFO - combo.training.trainer - Estimated training time remaining: 6:25:32\n",
      "2023-04-07 01:31:06,981 - INFO - allennlp.training.trainer - Epoch 118/399\n",
      "2023-04-07 01:31:06,982 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:31:06,982 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:31:06,992 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9584, LAS: 0.9244, UEM: 0.5742, LEM: 0.3493, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5284, partial_loss/deprel_loss: 0.4591, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6352, loss: 0.5838, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:   5%|4         | 5/111 [00:02<00:49,  2.13it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9661, LAS: 0.9330, UEM: 0.6756, LEM: 0.4417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2489, partial_loss/deprel_loss: 0.3630, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5024, loss: 0.5213, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:   8%|8         | 9/111 [00:05<00:53,  1.89it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9642, LAS: 0.9312, UEM: 0.6472, LEM: 0.4141, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2436, partial_loss/deprel_loss: 0.3190, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4661, loss: 0.5239, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:  12%|#1        | 13/111 [00:07<00:54,  1.79it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9160, UAS: 0.9629, LAS: 0.9304, UEM: 0.6386, LEM: 0.4124, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6097, partial_loss/deprel_loss: 0.4469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6417, loss: 0.5277, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:  15%|#5        | 17/111 [00:10<00:55,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9627, LAS: 0.9306, UEM: 0.6374, LEM: 0.4183, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4281, partial_loss/deprel_loss: 0.3719, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5453, loss: 0.5259, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:  19%|#8        | 21/111 [00:12<00:54,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9628, LAS: 0.9302, UEM: 0.6381, LEM: 0.4163, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4613, partial_loss/deprel_loss: 0.4099, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5824, loss: 0.5261, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:  23%|##3       | 26/111 [00:15<00:47,  1.78it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9630, LAS: 0.9303, UEM: 0.6479, LEM: 0.4259, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1632, partial_loss/deprel_loss: 0.2524, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3967, loss: 0.5214, batch_reg_loss: 0.1622, reg_loss: 0.1622 ||:  28%|##7       | 31/111 [00:17<00:42,  1.87it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9633, LAS: 0.9307, UEM: 0.6835, LEM: 0.4758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9265, partial_loss/deprel_loss: 0.5708, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8041, loss: 0.5189, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  32%|###1      | 35/111 [00:20<00:45,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9635, LAS: 0.9309, UEM: 0.6790, LEM: 0.4666, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3176, partial_loss/deprel_loss: 0.3150, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4776, loss: 0.5163, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  35%|###5      | 39/111 [00:23<00:48,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9644, LAS: 0.9317, UEM: 0.7036, LEM: 0.4959, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0596, partial_loss/deprel_loss: 0.1671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3077, loss: 0.5090, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  38%|###7      | 42/111 [00:26<00:49,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9243, UAS: 0.9646, LAS: 0.9317, UEM: 0.6970, LEM: 0.4853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4318, partial_loss/deprel_loss: 0.4018, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5699, loss: 0.5093, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  41%|####1     | 46/111 [00:28<00:45,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9643, LAS: 0.9313, UEM: 0.6905, LEM: 0.4775, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2069, partial_loss/deprel_loss: 0.3115, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4527, loss: 0.5109, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  44%|####4     | 49/111 [00:30<00:42,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9520, UAS: 0.9647, LAS: 0.9317, UEM: 0.6980, LEM: 0.4860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0849, partial_loss/deprel_loss: 0.1925, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3331, loss: 0.5082, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  47%|####6     | 52/111 [00:33<00:41,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9057, UAS: 0.9636, LAS: 0.9306, UEM: 0.6847, LEM: 0.4741, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7901, partial_loss/deprel_loss: 0.4558, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6847, loss: 0.5165, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  50%|#####     | 56/111 [00:35<00:37,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9637, LAS: 0.9306, UEM: 0.6816, LEM: 0.4689, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3447, partial_loss/deprel_loss: 0.3302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4952, loss: 0.5146, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  53%|#####3    | 59/111 [00:37<00:35,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9631, LAS: 0.9296, UEM: 0.6729, LEM: 0.4598, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3769, partial_loss/deprel_loss: 0.4646, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6091, loss: 0.5212, batch_reg_loss: 0.1621, reg_loss: 0.1622 ||:  56%|#####5    | 62/111 [00:39<00:33,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9633, LAS: 0.9297, UEM: 0.6692, LEM: 0.4535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2217, partial_loss/deprel_loss: 0.3478, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4846, loss: 0.5206, batch_reg_loss: 0.1621, reg_loss: 0.1621 ||:  59%|#####9    | 66/111 [00:41<00:28,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9627, LAS: 0.9290, UEM: 0.6628, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6047, partial_loss/deprel_loss: 0.4760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6637, loss: 0.5258, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  63%|######3   | 70/111 [00:45<00:28,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9625, LAS: 0.9287, UEM: 0.6564, LEM: 0.4398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4710, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5930, loss: 0.5275, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  66%|######5   | 73/111 [00:47<00:26,  1.41it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9627, LAS: 0.9290, UEM: 0.6556, LEM: 0.4382, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3633, partial_loss/deprel_loss: 0.3333, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5013, loss: 0.5263, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  69%|######9   | 77/111 [00:49<00:22,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9437, UAS: 0.9630, LAS: 0.9293, UEM: 0.6552, LEM: 0.4360, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2212, partial_loss/deprel_loss: 0.2669, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4198, loss: 0.5241, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  73%|#######2  | 81/111 [00:52<00:20,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9634, LAS: 0.9297, UEM: 0.6572, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1872, partial_loss/deprel_loss: 0.2738, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4185, loss: 0.5218, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  77%|#######6  | 85/111 [00:54<00:17,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9632, LAS: 0.9295, UEM: 0.6530, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2652, partial_loss/deprel_loss: 0.3209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4717, loss: 0.5238, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  80%|########  | 89/111 [00:57<00:14,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9628, LAS: 0.9290, UEM: 0.6508, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2090, partial_loss/deprel_loss: 0.3746, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5034, loss: 0.5269, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  84%|########3 | 93/111 [01:00<00:12,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9627, LAS: 0.9289, UEM: 0.6587, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1577, partial_loss/deprel_loss: 0.2665, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4067, loss: 0.5265, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  87%|########7 | 97/111 [01:03<00:10,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9625, LAS: 0.9288, UEM: 0.6574, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4383, partial_loss/deprel_loss: 0.4457, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6062, loss: 0.5284, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  90%|######### | 100/111 [01:05<00:07,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9621, LAS: 0.9284, UEM: 0.6529, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8222, partial_loss/deprel_loss: 0.5854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7947, loss: 0.5315, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  93%|#########2| 103/111 [01:07<00:05,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9622, LAS: 0.9286, UEM: 0.6580, LEM: 0.4379, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5416, partial_loss/deprel_loss: 0.4245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6099, loss: 0.5292, batch_reg_loss: 0.1620, reg_loss: 0.1621 ||:  95%|#########5| 106/111 [01:10<00:03,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8870, UAS: 0.9617, LAS: 0.9280, UEM: 0.6534, LEM: 0.4338, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0117, partial_loss/deprel_loss: 0.5263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7853, loss: 0.5327, batch_reg_loss: 0.1619, reg_loss: 0.1621 ||:  99%|#########9| 110/111 [01:13<00:00,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9006, UAS: 0.9615, LAS: 0.9277, UEM: 0.6512, LEM: 0.4323, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6477, partial_loss/deprel_loss: 0.5848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7593, loss: 0.5348, batch_reg_loss: 0.1619, reg_loss: 0.1621 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
      "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:32:24,077 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.585  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.648  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.162  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - UEM                      |     0.651  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - LAS                      |     0.928  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - loss                     |     0.535  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - LEM                      |     0.432  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - EM                       |     0.901  |       N/A\n",
      "2023-04-07 01:32:24,078 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:32:24,083 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:32:29,151 - INFO - combo.training.trainer - Epoch duration: 0:01:22.169650\n",
      "2023-04-07 01:32:29,152 - INFO - combo.training.trainer - Estimated training time remaining: 6:24:11\n",
      "2023-04-07 01:32:29,153 - INFO - allennlp.training.trainer - Epoch 119/399\n",
      "2023-04-07 01:32:29,153 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:32:29,153 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:32:29,162 - INFO - allennlp.training.trainer - Training\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9560, LAS: 0.9230, UEM: 0.6512, LEM: 0.4110, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6316, partial_loss/deprel_loss: 0.4480, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6467, loss: 0.5886, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:   5%|4         | 5/111 [00:02<00:52,  2.00it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8882, UAS: 0.9547, LAS: 0.9204, UEM: 0.5686, LEM: 0.3328, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9893, partial_loss/deprel_loss: 0.5484, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7985, loss: 0.5991, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:   9%|9         | 10/111 [00:04<00:49,  2.05it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9562, LAS: 0.9221, UEM: 0.5881, LEM: 0.3630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6123, partial_loss/deprel_loss: 0.4122, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6141, loss: 0.5779, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  14%|#3        | 15/111 [00:07<00:46,  2.07it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9342, UAS: 0.9558, LAS: 0.9221, UEM: 0.5655, LEM: 0.3452, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3024, partial_loss/deprel_loss: 0.3077, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.5763, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  17%|#7        | 19/111 [00:09<00:49,  1.88it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9103, UAS: 0.9567, LAS: 0.9229, UEM: 0.5671, LEM: 0.3446, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4757, partial_loss/deprel_loss: 0.4163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5901, loss: 0.5670, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  21%|##        | 23/111 [00:12<00:49,  1.78it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9273, UAS: 0.9571, LAS: 0.9234, UEM: 0.6038, LEM: 0.3925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2781, partial_loss/deprel_loss: 0.3534, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.5615, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  23%|##3       | 26/111 [00:14<00:53,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9688, UAS: 0.9594, LAS: 0.9259, UEM: 0.6656, LEM: 0.4674, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0312, partial_loss/deprel_loss: 0.1093, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2556, loss: 0.5430, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  26%|##6       | 29/111 [00:17<00:56,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9607, LAS: 0.9274, UEM: 0.6750, LEM: 0.4757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1359, partial_loss/deprel_loss: 0.2697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4048, loss: 0.5329, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  29%|##8       | 32/111 [00:19<00:57,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9607, LAS: 0.9274, UEM: 0.6677, LEM: 0.4672, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2178, partial_loss/deprel_loss: 0.2610, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4143, loss: 0.5330, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  32%|###1      | 35/111 [00:21<00:54,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9616, LAS: 0.9282, UEM: 0.6710, LEM: 0.4637, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2761, partial_loss/deprel_loss: 0.3460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4939, loss: 0.5294, batch_reg_loss: 0.1619, reg_loss: 0.1619 ||:  34%|###4      | 38/111 [00:23<00:51,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9283, UAS: 0.9621, LAS: 0.9284, UEM: 0.6754, LEM: 0.4638, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2917, partial_loss/deprel_loss: 0.3887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5312, loss: 0.5263, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  37%|###6      | 41/111 [00:25<00:49,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9617, LAS: 0.9280, UEM: 0.6783, LEM: 0.4673, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0769, partial_loss/deprel_loss: 0.2259, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3580, loss: 0.5280, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  40%|###9      | 44/111 [00:27<00:47,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9621, LAS: 0.9284, UEM: 0.6747, LEM: 0.4613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3800, partial_loss/deprel_loss: 0.3772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5396, loss: 0.5269, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  42%|####2     | 47/111 [00:29<00:44,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9163, UAS: 0.9608, LAS: 0.9271, UEM: 0.6570, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5127, partial_loss/deprel_loss: 0.4390, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6155, loss: 0.5357, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  46%|####5     | 51/111 [00:32<00:41,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9614, LAS: 0.9277, UEM: 0.6581, LEM: 0.4439, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3493, partial_loss/deprel_loss: 0.4118, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5611, loss: 0.5331, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  50%|####9     | 55/111 [00:35<00:38,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9612, LAS: 0.9275, UEM: 0.6545, LEM: 0.4409, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4683, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6035, loss: 0.5331, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  52%|#####2    | 58/111 [00:37<00:37,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9071, UAS: 0.9610, LAS: 0.9275, UEM: 0.6621, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5465, partial_loss/deprel_loss: 0.4218, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6085, loss: 0.5332, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  55%|#####4    | 61/111 [00:39<00:35,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9610, LAS: 0.9276, UEM: 0.6568, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3979, partial_loss/deprel_loss: 0.4106, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5698, loss: 0.5333, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  58%|#####7    | 64/111 [00:42<00:34,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9608, LAS: 0.9273, UEM: 0.6518, LEM: 0.4414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2573, partial_loss/deprel_loss: 0.3191, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4686, loss: 0.5350, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  60%|######    | 67/111 [00:44<00:31,  1.38it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9607, LAS: 0.9271, UEM: 0.6513, LEM: 0.4398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1883, partial_loss/deprel_loss: 0.3120, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4490, loss: 0.5358, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  63%|######3   | 70/111 [00:46<00:29,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9607, LAS: 0.9270, UEM: 0.6530, LEM: 0.4406, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3512, partial_loss/deprel_loss: 0.3129, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4823, loss: 0.5351, batch_reg_loss: 0.1618, reg_loss: 0.1619 ||:  67%|######6   | 74/111 [00:49<00:26,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9603, LAS: 0.9266, UEM: 0.6537, LEM: 0.4407, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2083, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4603, loss: 0.5373, batch_reg_loss: 0.1618, reg_loss: 0.1618 ||:  70%|#######   | 78/111 [00:51<00:23,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9600, LAS: 0.9264, UEM: 0.6507, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7320, partial_loss/deprel_loss: 0.4751, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6882, loss: 0.5391, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  73%|#######2  | 81/111 [00:54<00:22,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9596, LAS: 0.9260, UEM: 0.6459, LEM: 0.4345, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9141, partial_loss/deprel_loss: 0.5886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8154, loss: 0.5417, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  77%|#######6  | 85/111 [00:56<00:18,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9133, UAS: 0.9593, LAS: 0.9257, UEM: 0.6400, LEM: 0.4291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5148, partial_loss/deprel_loss: 0.4794, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6482, loss: 0.5443, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  79%|#######9  | 88/111 [00:59<00:16,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9596, LAS: 0.9261, UEM: 0.6410, LEM: 0.4290, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3060, partial_loss/deprel_loss: 0.2798, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4468, loss: 0.5411, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  82%|########1 | 91/111 [01:01<00:14,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9600, LAS: 0.9265, UEM: 0.6463, LEM: 0.4342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3279, partial_loss/deprel_loss: 0.3422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5010, loss: 0.5384, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  85%|########4 | 94/111 [01:03<00:12,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9601, LAS: 0.9266, UEM: 0.6469, LEM: 0.4343, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3405, partial_loss/deprel_loss: 0.3789, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5329, loss: 0.5386, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  87%|########7 | 97/111 [01:05<00:09,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9112, UAS: 0.9602, LAS: 0.9266, UEM: 0.6479, LEM: 0.4355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5201, partial_loss/deprel_loss: 0.4496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6254, loss: 0.5378, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  90%|######### | 100/111 [01:07<00:07,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9606, LAS: 0.9270, UEM: 0.6509, LEM: 0.4367, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5157, partial_loss/deprel_loss: 0.5044, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6684, loss: 0.5354, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  94%|#########3| 104/111 [01:09<00:04,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9607, LAS: 0.9271, UEM: 0.6519, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2124, partial_loss/deprel_loss: 0.3220, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4618, loss: 0.5335, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||:  97%|#########7| 108/111 [01:12<00:02,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9607, LAS: 0.9272, UEM: 0.6491, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.2724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4298, loss: 0.5331, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 100%|##########| 111/111 [01:14<00:00,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9358, UAS: 0.9607, LAS: 0.9272, UEM: 0.6491, LEM: 0.4348, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2512, partial_loss/deprel_loss: 0.2724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4298, loss: 0.5331, batch_reg_loss: 0.1617, reg_loss: 0.1618 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:33:46,617 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.272  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.251  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.162  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - UEM                      |     0.649  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - LAS                      |     0.927  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - loss                     |     0.533  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - LEM                      |     0.435  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - UAS                      |     0.961  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - EM                       |     0.936  |       N/A\n",
      "2023-04-07 01:33:46,618 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:33:46,623 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:33:54,256 - INFO - combo.training.trainer - Epoch duration: 0:01:25.103205\n",
      "2023-04-07 01:33:54,256 - INFO - combo.training.trainer - Estimated training time remaining: 6:22:56\n",
      "2023-04-07 01:33:54,257 - INFO - allennlp.training.trainer - Epoch 120/399\n",
      "2023-04-07 01:33:54,258 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:33:54,259 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:33:54,269 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9004, UAS: 0.9501, LAS: 0.9170, UEM: 0.5021, LEM: 0.3026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8535, partial_loss/deprel_loss: 0.5228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7506, loss: 0.5918, batch_reg_loss: 0.1617, reg_loss: 0.1617 ||:   4%|3         | 4/111 [00:02<01:01,  1.75it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9183, UAS: 0.9531, LAS: 0.9200, UEM: 0.4871, LEM: 0.2667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5064, partial_loss/deprel_loss: 0.4212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5999, loss: 0.5803, batch_reg_loss: 0.1617, reg_loss: 0.1617 ||:   7%|7         | 8/111 [00:05<01:02,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9130, UAS: 0.9541, LAS: 0.9206, UEM: 0.5231, LEM: 0.3075, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6122, partial_loss/deprel_loss: 0.4584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6508, loss: 0.5758, batch_reg_loss: 0.1616, reg_loss: 0.1617 ||:  10%|9         | 11/111 [00:07<01:05,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9580, LAS: 0.9244, UEM: 0.5806, LEM: 0.3570, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3549, partial_loss/deprel_loss: 0.3522, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5143, loss: 0.5547, batch_reg_loss: 0.1616, reg_loss: 0.1617 ||:  13%|#2        | 14/111 [00:09<01:05,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9164, UAS: 0.9595, LAS: 0.9262, UEM: 0.5897, LEM: 0.3669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5475, partial_loss/deprel_loss: 0.4541, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6344, loss: 0.5433, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  16%|#6        | 18/111 [00:12<01:01,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9603, LAS: 0.9269, UEM: 0.5869, LEM: 0.3581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3965, partial_loss/deprel_loss: 0.3725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5389, loss: 0.5377, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  20%|#9        | 22/111 [00:14<00:58,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9740, UAS: 0.9625, LAS: 0.9299, UEM: 0.6652, LEM: 0.4636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0359, partial_loss/deprel_loss: 0.1071, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2545, loss: 0.5194, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  23%|##2       | 25/111 [00:17<01:00,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9603, LAS: 0.9278, UEM: 0.6394, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2706, partial_loss/deprel_loss: 0.3206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4722, loss: 0.5364, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  26%|##6       | 29/111 [00:19<00:55,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9281, UAS: 0.9608, LAS: 0.9282, UEM: 0.6520, LEM: 0.4574, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2792, partial_loss/deprel_loss: 0.3689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5125, loss: 0.5330, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  29%|##8       | 32/111 [00:21<00:54,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9617, LAS: 0.9292, UEM: 0.6638, LEM: 0.4631, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6578, partial_loss/deprel_loss: 0.3979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6114, loss: 0.5262, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  32%|###2      | 36/111 [00:24<00:51,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9205, UAS: 0.9611, LAS: 0.9286, UEM: 0.6649, LEM: 0.4640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4831, partial_loss/deprel_loss: 0.4557, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6227, loss: 0.5295, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  36%|###6      | 40/111 [00:27<00:48,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9621, LAS: 0.9297, UEM: 0.6798, LEM: 0.4768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3156, partial_loss/deprel_loss: 0.4022, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5464, loss: 0.5221, batch_reg_loss: 0.1616, reg_loss: 0.1616 ||:  39%|###8      | 43/111 [00:29<00:46,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9175, UAS: 0.9620, LAS: 0.9296, UEM: 0.6714, LEM: 0.4641, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5441, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6147, loss: 0.5224, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  42%|####2     | 47/111 [00:31<00:42,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9086, UAS: 0.9619, LAS: 0.9292, UEM: 0.6658, LEM: 0.4540, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5552, partial_loss/deprel_loss: 0.4651, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6446, loss: 0.5248, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  46%|####5     | 51/111 [00:34<00:40,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9021, UAS: 0.9615, LAS: 0.9288, UEM: 0.6645, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7061, partial_loss/deprel_loss: 0.5740, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7619, loss: 0.5273, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  49%|####8     | 54/111 [00:36<00:38,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9615, LAS: 0.9286, UEM: 0.6585, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3896, partial_loss/deprel_loss: 0.4041, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5627, loss: 0.5292, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  52%|#####2    | 58/111 [00:38<00:34,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9623, LAS: 0.9292, UEM: 0.6673, LEM: 0.4507, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3596, partial_loss/deprel_loss: 0.4629, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6037, loss: 0.5255, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  56%|#####5    | 62/111 [00:41<00:32,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9382, UAS: 0.9628, LAS: 0.9299, UEM: 0.6752, LEM: 0.4595, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2684, partial_loss/deprel_loss: 0.3365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4844, loss: 0.5204, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  59%|#####8    | 65/111 [00:43<00:31,  1.44it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9619, LAS: 0.9288, UEM: 0.6688, LEM: 0.4528, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3563, partial_loss/deprel_loss: 0.3716, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5301, loss: 0.5295, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  61%|######1   | 68/111 [00:46<00:30,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9540, UAS: 0.9615, LAS: 0.9283, UEM: 0.6717, LEM: 0.4592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0960, partial_loss/deprel_loss: 0.1973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3385, loss: 0.5329, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  64%|######3   | 71/111 [00:48<00:29,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9340, UAS: 0.9619, LAS: 0.9286, UEM: 0.6709, LEM: 0.4567, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2529, partial_loss/deprel_loss: 0.3776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5141, loss: 0.5311, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  68%|######7   | 75/111 [00:51<00:25,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9210, UAS: 0.9617, LAS: 0.9284, UEM: 0.6664, LEM: 0.4508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4704, partial_loss/deprel_loss: 0.4265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5967, loss: 0.5322, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  71%|#######1  | 79/111 [00:53<00:22,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9618, LAS: 0.9285, UEM: 0.6676, LEM: 0.4516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2552, partial_loss/deprel_loss: 0.3319, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.5314, batch_reg_loss: 0.1615, reg_loss: 0.1616 ||:  74%|#######3  | 82/111 [00:56<00:20,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9618, LAS: 0.9283, UEM: 0.6666, LEM: 0.4497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1772, partial_loss/deprel_loss: 0.2633, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4075, loss: 0.5323, batch_reg_loss: 0.1614, reg_loss: 0.1616 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9617, LAS: 0.9283, UEM: 0.6735, LEM: 0.4597, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0861, partial_loss/deprel_loss: 0.5565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8239, loss: 0.5321, batch_reg_loss: 0.1614, reg_loss: 0.1616 ||:  80%|########  | 89/111 [01:01<00:15,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9616, LAS: 0.9283, UEM: 0.6689, LEM: 0.4549, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2165, partial_loss/deprel_loss: 0.3058, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4494, loss: 0.5322, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||:  84%|########3 | 93/111 [01:03<00:12,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9617, LAS: 0.9281, UEM: 0.6673, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1981, partial_loss/deprel_loss: 0.3654, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4933, loss: 0.5328, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||:  86%|########6 | 96/111 [01:05<00:10,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9617, LAS: 0.9281, UEM: 0.6644, LEM: 0.4475, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3597, partial_loss/deprel_loss: 0.3367, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5027, loss: 0.5319, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||:  90%|######### | 100/111 [01:08<00:07,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9613, LAS: 0.9277, UEM: 0.6560, LEM: 0.4402, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3539, partial_loss/deprel_loss: 0.3841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5394, loss: 0.5347, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||:  95%|#########4| 105/111 [01:10<00:03,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9615, LAS: 0.9278, UEM: 0.6528, LEM: 0.4349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1941, partial_loss/deprel_loss: 0.3065, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4454, loss: 0.5337, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||:  99%|#########9| 110/111 [01:12<00:00,  1.82it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9616, LAS: 0.9279, UEM: 0.6534, LEM: 0.4346, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2313, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4888, loss: 0.5333, batch_reg_loss: 0.1614, reg_loss: 0.1615 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
      "2023-04-07 01:35:10,476 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9340, LAS: 0.8843, UEM: 0.7299, LEM: 0.4799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1551, partial_loss/deprel_loss: 22.5874, partial_loss/cycle_loss: 0.0000, batch_loss: 18.1009, loss: 30.5976, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  15%|#5        | 2/13 [00:02<00:12,  1.10s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9231, UAS: 0.9563, LAS: 0.9123, UEM: 0.8067, LEM: 0.5765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3924, partial_loss/deprel_loss: 25.3394, partial_loss/cycle_loss: 0.0000, batch_loss: 20.3500, loss: 21.9278, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  38%|###8      | 5/13 [00:05<00:08,  1.06s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8809, UAS: 0.9492, LAS: 0.9002, UEM: 0.7154, LEM: 0.4758, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1023, partial_loss/deprel_loss: 41.2377, partial_loss/cycle_loss: 0.0000, batch_loss: 33.2106, loss: 24.2740, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:08<00:05,  1.04s/it]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9480, LAS: 0.8980, UEM: 0.6665, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7164, partial_loss/deprel_loss: 32.8922, partial_loss/cycle_loss: 0.0000, batch_loss: 26.4571, loss: 23.9450, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.01it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9475, LAS: 0.8973, UEM: 0.6503, LEM: 0.3892, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4480, partial_loss/deprel_loss: 23.6254, partial_loss/cycle_loss: 0.0000, batch_loss: 18.9900, loss: 24.5413, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
      "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:35:23,094 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - patience                 |     4.000  |       N/A\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.351  |    23.625\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.231  |     0.448\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.162  |     0.000\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - UEM                      |     0.653  |     0.650\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - LAS                      |     0.928  |     0.897\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - loss                     |     0.533  |    24.541\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - LEM                      |     0.435  |     0.389\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |     0.947\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:35:23,095 - INFO - combo.training.tensorboard_writer - EM                       |     0.935  |     0.914\n",
      "2023-04-07 01:35:23,096 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:35:23,101 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:35:28,020 - INFO - combo.training.trainer - Epoch duration: 0:01:33.762829\n",
      "2023-04-07 01:35:28,021 - INFO - combo.training.trainer - Estimated training time remaining: 6:22:01\n",
      "2023-04-07 01:35:28,021 - INFO - allennlp.training.trainer - Epoch 121/399\n",
      "2023-04-07 01:35:28,021 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:35:28,021 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:35:28,028 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9115, UAS: 0.9625, LAS: 0.9278, UEM: 0.6975, LEM: 0.4612, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6757, partial_loss/deprel_loss: 0.4689, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6717, loss: 0.5151, batch_reg_loss: 0.1614, reg_loss: 0.1614 ||:   3%|2         | 3/111 [00:02<01:16,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9672, LAS: 0.9355, UEM: 0.7027, LEM: 0.4777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2837, partial_loss/deprel_loss: 0.3431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4926, loss: 0.4797, batch_reg_loss: 0.1614, reg_loss: 0.1614 ||:   6%|6         | 7/111 [00:04<01:10,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9059, UAS: 0.9678, LAS: 0.9357, UEM: 0.7548, LEM: 0.5496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6550, partial_loss/deprel_loss: 0.5144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7039, loss: 0.4759, batch_reg_loss: 0.1614, reg_loss: 0.1614 ||:   9%|9         | 10/111 [00:06<01:08,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9383, UAS: 0.9662, LAS: 0.9341, UEM: 0.7161, LEM: 0.5052, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2910, partial_loss/deprel_loss: 0.2941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4548, loss: 0.4895, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||:  12%|#1        | 13/111 [00:08<01:07,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9625, LAS: 0.9294, UEM: 0.7186, LEM: 0.5103, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0669, partial_loss/deprel_loss: 0.2664, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3879, loss: 0.5213, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||:  14%|#4        | 16/111 [00:11<01:07,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9170, UAS: 0.9621, LAS: 0.9291, UEM: 0.6897, LEM: 0.4818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4282, partial_loss/deprel_loss: 0.4310, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5918, loss: 0.5272, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||:  18%|#8        | 20/111 [00:13<01:02,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9629, LAS: 0.9297, UEM: 0.7008, LEM: 0.4936, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4723, partial_loss/deprel_loss: 0.4305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6002, loss: 0.5215, batch_reg_loss: 0.1613, reg_loss: 0.1614 ||:  21%|##        | 23/111 [00:15<01:02,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9048, UAS: 0.9615, LAS: 0.9286, UEM: 0.6829, LEM: 0.4761, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7597, partial_loss/deprel_loss: 0.5481, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7517, loss: 0.5324, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  23%|##3       | 26/111 [00:17<00:59,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9601, LAS: 0.9271, UEM: 0.6503, LEM: 0.4472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3940, partial_loss/deprel_loss: 0.3808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.5419, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  27%|##7       | 30/111 [00:20<00:56,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9327, UAS: 0.9600, LAS: 0.9269, UEM: 0.6390, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3166, partial_loss/deprel_loss: 0.3335, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4914, loss: 0.5444, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  30%|##9       | 33/111 [00:22<00:54,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9123, UAS: 0.9602, LAS: 0.9271, UEM: 0.6246, LEM: 0.4132, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5958, partial_loss/deprel_loss: 0.4498, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6403, loss: 0.5440, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  33%|###3      | 37/111 [00:25<00:49,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8925, UAS: 0.9592, LAS: 0.9259, UEM: 0.6117, LEM: 0.4009, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9584, partial_loss/deprel_loss: 0.5039, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7561, loss: 0.5516, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  36%|###6      | 40/111 [00:27<00:48,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8916, UAS: 0.9582, LAS: 0.9248, UEM: 0.5995, LEM: 0.3884, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8587, partial_loss/deprel_loss: 0.6059, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8177, loss: 0.5590, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  39%|###8      | 43/111 [00:29<00:46,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9592, LAS: 0.9257, UEM: 0.6153, LEM: 0.4001, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1867, partial_loss/deprel_loss: 0.2768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4200, loss: 0.5514, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  41%|####1     | 46/111 [00:31<00:46,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8932, UAS: 0.9586, LAS: 0.9252, UEM: 0.6056, LEM: 0.3905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8144, partial_loss/deprel_loss: 0.5216, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7414, loss: 0.5554, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  45%|####5     | 50/111 [00:34<00:42,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9596, LAS: 0.9260, UEM: 0.6167, LEM: 0.3957, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1388, partial_loss/deprel_loss: 0.2741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4083, loss: 0.5495, batch_reg_loss: 0.1613, reg_loss: 0.1613 ||:  48%|####7     | 53/111 [00:36<00:41,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9271, UAS: 0.9602, LAS: 0.9265, UEM: 0.6188, LEM: 0.3926, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2883, partial_loss/deprel_loss: 0.3921, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5326, loss: 0.5468, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  51%|#####1    | 57/111 [00:39<00:37,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9598, LAS: 0.9262, UEM: 0.6186, LEM: 0.3944, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1625, partial_loss/deprel_loss: 0.2233, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3724, loss: 0.5476, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  55%|#####4    | 61/111 [00:41<00:33,  1.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9179, UAS: 0.9602, LAS: 0.9266, UEM: 0.6270, LEM: 0.4035, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4080, partial_loss/deprel_loss: 0.4123, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5727, loss: 0.5433, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  59%|#####8    | 65/111 [00:43<00:29,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9449, UAS: 0.9609, LAS: 0.9273, UEM: 0.6400, LEM: 0.4165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1509, partial_loss/deprel_loss: 0.2523, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3933, loss: 0.5379, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  62%|######2   | 69/111 [00:46<00:25,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9614, LAS: 0.9277, UEM: 0.6463, LEM: 0.4210, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2193, partial_loss/deprel_loss: 0.3163, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4581, loss: 0.5341, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  66%|######5   | 73/111 [00:48<00:22,  1.73it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9614, LAS: 0.9276, UEM: 0.6457, LEM: 0.4195, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2231, partial_loss/deprel_loss: 0.3305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4702, loss: 0.5339, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  70%|#######   | 78/111 [00:50<00:18,  1.83it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9732, UAS: 0.9616, LAS: 0.9279, UEM: 0.6571, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0336, partial_loss/deprel_loss: 0.0988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2469, loss: 0.5322, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  74%|#######3  | 82/111 [00:53<00:17,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9616, LAS: 0.9279, UEM: 0.6532, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5493, partial_loss/deprel_loss: 0.4245, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6106, loss: 0.5317, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  77%|#######7  | 86/111 [00:56<00:16,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9492, UAS: 0.9621, LAS: 0.9284, UEM: 0.6628, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1212, partial_loss/deprel_loss: 0.2469, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3829, loss: 0.5276, batch_reg_loss: 0.1612, reg_loss: 0.1613 ||:  81%|########1 | 90/111 [00:58<00:13,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9621, LAS: 0.9284, UEM: 0.6589, LEM: 0.4386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2574, partial_loss/deprel_loss: 0.3425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4866, loss: 0.5275, batch_reg_loss: 0.1611, reg_loss: 0.1613 ||:  85%|########4 | 94/111 [01:01<00:10,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9617, LAS: 0.9281, UEM: 0.6526, LEM: 0.4330, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4018, partial_loss/deprel_loss: 0.4294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5850, loss: 0.5303, batch_reg_loss: 0.1611, reg_loss: 0.1613 ||:  88%|########8 | 98/111 [01:03<00:08,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9618, LAS: 0.9281, UEM: 0.6492, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2187, partial_loss/deprel_loss: 0.3255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4653, loss: 0.5298, batch_reg_loss: 0.1611, reg_loss: 0.1613 ||:  92%|#########1| 102/111 [01:06<00:05,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9621, LAS: 0.9285, UEM: 0.6590, LEM: 0.4395, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1560, partial_loss/deprel_loss: 0.2417, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3856, loss: 0.5267, batch_reg_loss: 0.1611, reg_loss: 0.1612 ||:  95%|#########5| 106/111 [01:09<00:03,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9620, LAS: 0.9284, UEM: 0.6538, LEM: 0.4340, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2230, partial_loss/deprel_loss: 0.3147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4574, loss: 0.5279, batch_reg_loss: 0.1611, reg_loss: 0.1612 ||:  99%|#########9| 110/111 [01:11<00:00,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9317, UAS: 0.9620, LAS: 0.9284, UEM: 0.6522, LEM: 0.4325, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3857, partial_loss/deprel_loss: 0.3601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5263, loss: 0.5279, batch_reg_loss: 0.1611, reg_loss: 0.1612 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
      "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:36:43,250 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.360  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.386  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.161  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - UEM                      |     0.652  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - LAS                      |     0.928  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - loss                     |     0.528  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - LEM                      |     0.433  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - EM                       |     0.932  |       N/A\n",
      "2023-04-07 01:36:43,251 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:36:43,257 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:36:49,054 - INFO - combo.training.trainer - Epoch duration: 0:01:21.032962\n",
      "2023-04-07 01:36:49,054 - INFO - combo.training.trainer - Estimated training time remaining: 6:20:36\n",
      "2023-04-07 01:36:49,054 - INFO - allennlp.training.trainer - Epoch 122/399\n",
      "2023-04-07 01:36:49,055 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:36:49,055 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:36:49,065 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9468, UAS: 0.9650, LAS: 0.9338, UEM: 0.6522, LEM: 0.4229, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1713, partial_loss/deprel_loss: 0.2491, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3946, loss: 0.4751, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||:   3%|2         | 3/111 [00:02<01:13,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9424, UAS: 0.9639, LAS: 0.9312, UEM: 0.6423, LEM: 0.4008, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1668, partial_loss/deprel_loss: 0.2690, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4096, loss: 0.4931, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||:   5%|5         | 6/111 [00:04<01:15,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9088, UAS: 0.9595, LAS: 0.9277, UEM: 0.6090, LEM: 0.3797, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6934, partial_loss/deprel_loss: 0.4242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6391, loss: 0.5225, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||:   8%|8         | 9/111 [00:06<01:12,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9198, UAS: 0.9620, LAS: 0.9302, UEM: 0.6435, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5243, partial_loss/deprel_loss: 0.4132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5965, loss: 0.5120, batch_reg_loss: 0.1611, reg_loss: 0.1611 ||:  11%|#         | 12/111 [00:08<01:10,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9144, UAS: 0.9622, LAS: 0.9303, UEM: 0.6295, LEM: 0.4019, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5368, partial_loss/deprel_loss: 0.4377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6186, loss: 0.5119, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||:  14%|#4        | 16/111 [00:11<01:06,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9621, LAS: 0.9310, UEM: 0.6313, LEM: 0.4091, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1706, partial_loss/deprel_loss: 0.2616, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4044, loss: 0.5085, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||:  18%|#8        | 20/111 [00:13<01:02,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9392, UAS: 0.9600, LAS: 0.9284, UEM: 0.6104, LEM: 0.3878, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2424, partial_loss/deprel_loss: 0.3302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4736, loss: 0.5285, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||:  22%|##1       | 24/111 [00:16<00:57,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9351, UAS: 0.9605, LAS: 0.9289, UEM: 0.6192, LEM: 0.3952, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2865, partial_loss/deprel_loss: 0.2876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4484, loss: 0.5258, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||:  24%|##4       | 27/111 [00:18<00:57,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9619, LAS: 0.9303, UEM: 0.6544, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1432, partial_loss/deprel_loss: 0.2489, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3888, loss: 0.5141, batch_reg_loss: 0.1610, reg_loss: 0.1611 ||:  27%|##7       | 30/111 [00:21<00:58,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9629, LAS: 0.9312, UEM: 0.6662, LEM: 0.4462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3693, partial_loss/deprel_loss: 0.3934, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5496, loss: 0.5084, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  30%|##9       | 33/111 [00:23<00:57,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9082, UAS: 0.9629, LAS: 0.9305, UEM: 0.6631, LEM: 0.4380, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5729, partial_loss/deprel_loss: 0.5477, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7137, loss: 0.5118, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  32%|###2      | 36/111 [00:25<00:53,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9633, LAS: 0.9313, UEM: 0.6878, LEM: 0.4793, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2916, partial_loss/deprel_loss: 0.3384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4900, loss: 0.5070, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  35%|###5      | 39/111 [00:27<00:54,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9630, LAS: 0.9308, UEM: 0.6790, LEM: 0.4691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4333, partial_loss/deprel_loss: 0.4353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5959, loss: 0.5128, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  38%|###7      | 42/111 [00:29<00:50,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9631, LAS: 0.9308, UEM: 0.6764, LEM: 0.4639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5079, partial_loss/deprel_loss: 0.3939, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5777, loss: 0.5122, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  41%|####      | 45/111 [00:31<00:47,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9343, UAS: 0.9633, LAS: 0.9310, UEM: 0.6768, LEM: 0.4627, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2611, partial_loss/deprel_loss: 0.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4829, loss: 0.5085, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  45%|####5     | 50/111 [00:34<00:38,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9636, LAS: 0.9313, UEM: 0.6799, LEM: 0.4677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1367, partial_loss/deprel_loss: 0.2098, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3562, loss: 0.5074, batch_reg_loss: 0.1610, reg_loss: 0.1610 ||:  49%|####8     | 54/111 [00:36<00:36,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9640, LAS: 0.9317, UEM: 0.6884, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4297, partial_loss/deprel_loss: 0.4490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6061, loss: 0.5048, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  52%|#####2    | 58/111 [00:39<00:34,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9637, LAS: 0.9314, UEM: 0.6777, LEM: 0.4678, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3982, partial_loss/deprel_loss: 0.3819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5461, loss: 0.5078, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  56%|#####5    | 62/111 [00:42<00:31,  1.55it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9078, UAS: 0.9630, LAS: 0.9305, UEM: 0.6654, LEM: 0.4556, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6359, partial_loss/deprel_loss: 0.4622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6578, loss: 0.5146, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  59%|#####9    | 66/111 [00:44<00:28,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9625, LAS: 0.9298, UEM: 0.6570, LEM: 0.4457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3815, partial_loss/deprel_loss: 0.3840, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5444, loss: 0.5197, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  63%|######3   | 70/111 [00:46<00:24,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8922, UAS: 0.9622, LAS: 0.9297, UEM: 0.6520, LEM: 0.4398, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0289, partial_loss/deprel_loss: 0.5635, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8175, loss: 0.5221, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  68%|######7   | 75/111 [00:48<00:20,  1.78it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9626, LAS: 0.9299, UEM: 0.6525, LEM: 0.4355, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2345, partial_loss/deprel_loss: 0.3180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4622, loss: 0.5188, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  72%|#######2  | 80/111 [00:51<00:16,  1.86it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9625, LAS: 0.9298, UEM: 0.6539, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2805, partial_loss/deprel_loss: 0.3755, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5174, loss: 0.5198, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  76%|#######5  | 84/111 [00:54<00:16,  1.69it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8951, UAS: 0.9627, LAS: 0.9299, UEM: 0.6608, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7551, partial_loss/deprel_loss: 0.5496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7516, loss: 0.5183, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  79%|#######9  | 88/111 [00:56<00:14,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9150, UAS: 0.9627, LAS: 0.9299, UEM: 0.6589, LEM: 0.4416, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5500, partial_loss/deprel_loss: 0.4632, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6415, loss: 0.5184, batch_reg_loss: 0.1609, reg_loss: 0.1610 ||:  83%|########2 | 92/111 [00:59<00:12,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9560, UAS: 0.9624, LAS: 0.9296, UEM: 0.6645, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0866, partial_loss/deprel_loss: 0.1841, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3254, loss: 0.5205, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||:  86%|########6 | 96/111 [01:03<00:10,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9414, UAS: 0.9627, LAS: 0.9298, UEM: 0.6662, LEM: 0.4488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1921, partial_loss/deprel_loss: 0.2776, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4213, loss: 0.5180, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||:  90%|######### | 100/111 [01:05<00:07,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9373, UAS: 0.9626, LAS: 0.9297, UEM: 0.6625, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2944, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5009, loss: 0.5188, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||:  94%|#########3| 104/111 [01:08<00:04,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9178, UAS: 0.9625, LAS: 0.9296, UEM: 0.6571, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4424, partial_loss/deprel_loss: 0.4296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5929, loss: 0.5207, batch_reg_loss: 0.1608, reg_loss: 0.1610 ||:  97%|#########7| 108/111 [01:10<00:01,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8862, UAS: 0.9621, LAS: 0.9291, UEM: 0.6547, LEM: 0.4372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9304, partial_loss/deprel_loss: 0.6028, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8291, loss: 0.5234, batch_reg_loss: 0.1608, reg_loss: 0.1609 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
      "2023-04-07 01:38:04,746 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.603  |       N/A\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.930  |       N/A\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.161  |       N/A\n",
      "2023-04-07 01:38:04,747 - INFO - combo.training.tensorboard_writer - UEM                      |     0.655  |       N/A\n",
      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - loss                     |     0.523  |       N/A\n",
      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - LEM                      |     0.437  |       N/A\n",
      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - EM                       |     0.886  |       N/A\n",
      "2023-04-07 01:38:04,748 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:38:04,753 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:38:09,561 - INFO - combo.training.trainer - Epoch duration: 0:01:20.506074\n",
      "2023-04-07 01:38:09,561 - INFO - combo.training.trainer - Estimated training time remaining: 6:19:10\n",
      "2023-04-07 01:38:09,561 - INFO - allennlp.training.trainer - Epoch 123/399\n",
      "2023-04-07 01:38:09,561 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:38:09,562 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:38:09,571 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9549, LAS: 0.9194, UEM: 0.5681, LEM: 0.3599, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5232, partial_loss/deprel_loss: 0.4827, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6516, loss: 0.6007, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:   3%|2         | 3/111 [00:02<01:23,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9627, LAS: 0.9298, UEM: 0.6188, LEM: 0.3916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2662, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5011, loss: 0.5094, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:   6%|6         | 7/111 [00:04<01:16,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9634, LAS: 0.9311, UEM: 0.6393, LEM: 0.4116, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1946, partial_loss/deprel_loss: 0.2854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4280, loss: 0.5030, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:   9%|9         | 10/111 [00:07<01:13,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9355, UAS: 0.9645, LAS: 0.9316, UEM: 0.6506, LEM: 0.4153, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2571, partial_loss/deprel_loss: 0.3332, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4788, loss: 0.5021, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:  13%|#2        | 14/111 [00:09<01:08,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9662, LAS: 0.9337, UEM: 0.6572, LEM: 0.4175, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2175, partial_loss/deprel_loss: 0.2773, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4261, loss: 0.4903, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:  16%|#6        | 18/111 [00:12<01:02,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9576, UAS: 0.9671, LAS: 0.9346, UEM: 0.6837, LEM: 0.4518, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0700, partial_loss/deprel_loss: 0.1836, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3216, loss: 0.4854, batch_reg_loss: 0.1608, reg_loss: 0.1608 ||:  19%|#8        | 21/111 [00:14<01:02,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9189, UAS: 0.9682, LAS: 0.9361, UEM: 0.7249, LEM: 0.5181, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5037, partial_loss/deprel_loss: 0.4371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6111, loss: 0.4779, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||:  22%|##1       | 24/111 [00:16<01:03,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9669, LAS: 0.9349, UEM: 0.7034, LEM: 0.4947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3045, partial_loss/deprel_loss: 0.3622, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5114, loss: 0.4832, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||:  25%|##5       | 28/111 [00:19<00:56,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9646, LAS: 0.9328, UEM: 0.6862, LEM: 0.4788, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.3070, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4493, loss: 0.4968, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||:  29%|##8       | 32/111 [00:21<00:52,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9639, LAS: 0.9318, UEM: 0.6867, LEM: 0.4800, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2530, partial_loss/deprel_loss: 0.3480, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4897, loss: 0.5024, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||:  32%|###2      | 36/111 [00:24<00:49,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9632, LAS: 0.9314, UEM: 0.6798, LEM: 0.4733, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3144, partial_loss/deprel_loss: 0.3244, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4831, loss: 0.5084, batch_reg_loss: 0.1607, reg_loss: 0.1608 ||:  36%|###6      | 40/111 [00:26<00:45,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9416, UAS: 0.9624, LAS: 0.9305, UEM: 0.6818, LEM: 0.4755, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1474, partial_loss/deprel_loss: 0.2510, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3910, loss: 0.5125, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||:  40%|###9      | 44/111 [00:29<00:45,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9616, LAS: 0.9297, UEM: 0.6681, LEM: 0.4633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4001, partial_loss/deprel_loss: 0.4014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5619, loss: 0.5174, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||:  42%|####2     | 47/111 [00:31<00:43,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9159, UAS: 0.9607, LAS: 0.9289, UEM: 0.6482, LEM: 0.4455, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5704, partial_loss/deprel_loss: 0.4718, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6522, loss: 0.5269, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||:  47%|####6     | 52/111 [00:34<00:36,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9599, LAS: 0.9278, UEM: 0.6335, LEM: 0.4289, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3542, partial_loss/deprel_loss: 0.3405, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5039, loss: 0.5339, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||:  51%|#####1    | 57/111 [00:36<00:31,  1.74it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9248, UAS: 0.9601, LAS: 0.9277, UEM: 0.6278, LEM: 0.4223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3126, partial_loss/deprel_loss: 0.3265, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4844, loss: 0.5320, batch_reg_loss: 0.1607, reg_loss: 0.1607 ||:  56%|#####5    | 62/111 [00:38<00:26,  1.86it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9605, LAS: 0.9281, UEM: 0.6417, LEM: 0.4369, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1840, partial_loss/deprel_loss: 0.2735, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4163, loss: 0.5269, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  59%|#####9    | 66/111 [00:41<00:26,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9610, LAS: 0.9285, UEM: 0.6508, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2534, partial_loss/deprel_loss: 0.3795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5149, loss: 0.5238, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  63%|######3   | 70/111 [00:44<00:26,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9610, LAS: 0.9285, UEM: 0.6460, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6746, partial_loss/deprel_loss: 0.4760, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6763, loss: 0.5240, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  67%|######6   | 74/111 [00:47<00:24,  1.50it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9608, LAS: 0.9282, UEM: 0.6378, LEM: 0.4305, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2414, partial_loss/deprel_loss: 0.3349, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4768, loss: 0.5275, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  70%|#######   | 78/111 [00:49<00:21,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9609, LAS: 0.9282, UEM: 0.6335, LEM: 0.4236, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3490, partial_loss/deprel_loss: 0.3569, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5159, loss: 0.5275, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  74%|#######3  | 82/111 [00:52<00:18,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9609, LAS: 0.9282, UEM: 0.6348, LEM: 0.4253, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1496, partial_loss/deprel_loss: 0.2676, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4046, loss: 0.5278, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  77%|#######7  | 86/111 [00:54<00:15,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9612, LAS: 0.9283, UEM: 0.6366, LEM: 0.4246, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2001, partial_loss/deprel_loss: 0.2907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4332, loss: 0.5276, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  81%|########1 | 90/111 [01:00<00:17,  1.17it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9614, LAS: 0.9285, UEM: 0.6366, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1536, partial_loss/deprel_loss: 0.2921, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4250, loss: 0.5268, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  84%|########3 | 93/111 [01:02<00:14,  1.21it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9613, LAS: 0.9283, UEM: 0.6353, LEM: 0.4225, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6619, partial_loss/deprel_loss: 0.4325, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6390, loss: 0.5270, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  87%|########7 | 97/111 [01:05<00:10,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9027, UAS: 0.9613, LAS: 0.9283, UEM: 0.6374, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5876, partial_loss/deprel_loss: 0.5230, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6964, loss: 0.5270, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  90%|######### | 100/111 [01:07<00:08,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9616, LAS: 0.9286, UEM: 0.6455, LEM: 0.4341, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0841, partial_loss/deprel_loss: 0.1611, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3063, loss: 0.5250, batch_reg_loss: 0.1606, reg_loss: 0.1607 ||:  93%|#########2| 103/111 [01:09<00:05,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9621, LAS: 0.9290, UEM: 0.6533, LEM: 0.4414, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0820, partial_loss/deprel_loss: 0.2228, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3552, loss: 0.5223, batch_reg_loss: 0.1605, reg_loss: 0.1607 ||:  95%|#########5| 106/111 [01:11<00:03,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9618, LAS: 0.9288, UEM: 0.6516, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3803, partial_loss/deprel_loss: 0.3741, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5359, loss: 0.5229, batch_reg_loss: 0.1605, reg_loss: 0.1607 ||:  99%|#########9| 110/111 [01:14<00:00,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9619, LAS: 0.9288, UEM: 0.6520, LEM: 0.4385, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2427, partial_loss/deprel_loss: 0.2956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4456, loss: 0.5222, batch_reg_loss: 0.1605, reg_loss: 0.1607 ||: 100%|##########| 111/111 [01:14<00:00,  1.48it/s]\n",
      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:39:27,734 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.296  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.243  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.161  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - UEM                      |     0.652  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - loss                     |     0.522  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - LEM                      |     0.439  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - EM                       |     0.935  |       N/A\n",
      "2023-04-07 01:39:27,735 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:39:27,740 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:39:32,872 - INFO - combo.training.trainer - Epoch duration: 0:01:23.310651\n",
      "2023-04-07 01:39:32,872 - INFO - combo.training.trainer - Estimated training time remaining: 6:17:51\n",
      "2023-04-07 01:39:32,872 - INFO - allennlp.training.trainer - Epoch 124/399\n",
      "2023-04-07 01:39:32,872 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:39:32,873 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:39:32,880 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9491, LAS: 0.9161, UEM: 0.6139, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5117, partial_loss/deprel_loss: 0.4023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5847, loss: 0.5831, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:   3%|2         | 3/111 [00:02<01:17,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9380, UAS: 0.9620, LAS: 0.9297, UEM: 0.7283, LEM: 0.5279, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2584, partial_loss/deprel_loss: 0.3415, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4854, loss: 0.4947, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:   6%|6         | 7/111 [00:04<01:11,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9410, UAS: 0.9588, LAS: 0.9263, UEM: 0.6802, LEM: 0.4857, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2412, partial_loss/deprel_loss: 0.2967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4461, loss: 0.5317, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:   9%|9         | 10/111 [00:06<01:12,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9610, LAS: 0.9292, UEM: 0.6884, LEM: 0.4948, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2238, partial_loss/deprel_loss: 0.2941, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4406, loss: 0.5143, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:  12%|#1        | 13/111 [00:09<01:10,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9613, LAS: 0.9293, UEM: 0.6973, LEM: 0.5000, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1493, partial_loss/deprel_loss: 0.2606, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3989, loss: 0.5118, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:  14%|#4        | 16/111 [00:11<01:11,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9637, LAS: 0.9318, UEM: 0.7138, LEM: 0.5118, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1904, partial_loss/deprel_loss: 0.2853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.4976, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:  17%|#7        | 19/111 [00:14<01:11,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9254, UAS: 0.9640, LAS: 0.9321, UEM: 0.6946, LEM: 0.4842, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4298, partial_loss/deprel_loss: 0.4258, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5871, loss: 0.4999, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:  21%|##        | 23/111 [00:16<01:04,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9295, UAS: 0.9647, LAS: 0.9322, UEM: 0.6975, LEM: 0.4816, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2924, partial_loss/deprel_loss: 0.3637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5099, loss: 0.4974, batch_reg_loss: 0.1605, reg_loss: 0.1605 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9642, LAS: 0.9318, UEM: 0.6884, LEM: 0.4722, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1649, partial_loss/deprel_loss: 0.2476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3915, loss: 0.5012, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  27%|##7       | 30/111 [00:21<00:55,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8632, UAS: 0.9608, LAS: 0.9285, UEM: 0.6741, LEM: 0.4611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3414, partial_loss/deprel_loss: 0.6991, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9880, loss: 0.5256, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  32%|###1      | 35/111 [00:23<00:47,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9401, UAS: 0.9610, LAS: 0.9290, UEM: 0.6652, LEM: 0.4505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2631, partial_loss/deprel_loss: 0.2850, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4410, loss: 0.5230, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  36%|###6      | 40/111 [00:25<00:40,  1.75it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9040, UAS: 0.9595, LAS: 0.9278, UEM: 0.6427, LEM: 0.4307, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7856, partial_loss/deprel_loss: 0.4250, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6576, loss: 0.5322, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  41%|####      | 45/111 [00:27<00:35,  1.88it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9603, LAS: 0.9287, UEM: 0.6684, LEM: 0.4677, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1457, partial_loss/deprel_loss: 0.3193, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4450, loss: 0.5273, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  44%|####4     | 49/111 [00:30<00:34,  1.78it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9606, LAS: 0.9289, UEM: 0.6664, LEM: 0.4633, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1772, partial_loss/deprel_loss: 0.3141, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4471, loss: 0.5259, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  48%|####7     | 53/111 [00:33<00:34,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9604, LAS: 0.9284, UEM: 0.6559, LEM: 0.4512, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4398, partial_loss/deprel_loss: 0.4302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5925, loss: 0.5301, batch_reg_loss: 0.1604, reg_loss: 0.1605 ||:  51%|#####1    | 57/111 [00:36<00:35,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9336, UAS: 0.9608, LAS: 0.9289, UEM: 0.6569, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2930, partial_loss/deprel_loss: 0.3515, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5002, loss: 0.5271, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||:  55%|#####4    | 61/111 [00:39<00:33,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9346, UAS: 0.9612, LAS: 0.9292, UEM: 0.6546, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3279, partial_loss/deprel_loss: 0.3412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4989, loss: 0.5240, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||:  59%|#####8    | 65/111 [00:42<00:31,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9193, UAS: 0.9609, LAS: 0.9288, UEM: 0.6453, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4810, partial_loss/deprel_loss: 0.4411, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6094, loss: 0.5271, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||:  62%|######2   | 69/111 [00:44<00:27,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9244, UAS: 0.9615, LAS: 0.9291, UEM: 0.6501, LEM: 0.4342, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3155, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5603, loss: 0.5236, batch_reg_loss: 0.1604, reg_loss: 0.1604 ||:  66%|######5   | 73/111 [00:47<00:25,  1.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9460, UAS: 0.9618, LAS: 0.9295, UEM: 0.6574, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1190, partial_loss/deprel_loss: 0.2381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3747, loss: 0.5203, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  69%|######9   | 77/111 [00:50<00:23,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9397, UAS: 0.9619, LAS: 0.9296, UEM: 0.6547, LEM: 0.4383, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2334, partial_loss/deprel_loss: 0.2876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4371, loss: 0.5202, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  72%|#######2  | 80/111 [00:52<00:21,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9544, UAS: 0.9620, LAS: 0.9295, UEM: 0.6601, LEM: 0.4470, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0805, partial_loss/deprel_loss: 0.1624, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3063, loss: 0.5197, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  75%|#######4  | 83/111 [00:54<00:19,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9623, LAS: 0.9298, UEM: 0.6635, LEM: 0.4503, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4317, partial_loss/deprel_loss: 0.4249, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5866, loss: 0.5184, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  78%|#######8  | 87/111 [00:57<00:16,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9623, LAS: 0.9299, UEM: 0.6621, LEM: 0.4477, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2083, partial_loss/deprel_loss: 0.3284, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4647, loss: 0.5186, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  82%|########1 | 91/111 [00:59<00:13,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9624, LAS: 0.9299, UEM: 0.6604, LEM: 0.4445, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3465, partial_loss/deprel_loss: 0.3166, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4829, loss: 0.5171, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  85%|########4 | 94/111 [01:01<00:11,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9430, UAS: 0.9622, LAS: 0.9298, UEM: 0.6586, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1817, partial_loss/deprel_loss: 0.2733, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4153, loss: 0.5183, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  88%|########8 | 98/111 [01:04<00:08,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9143, UAS: 0.9618, LAS: 0.9294, UEM: 0.6544, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4789, partial_loss/deprel_loss: 0.4105, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5844, loss: 0.5203, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  92%|#########1| 102/111 [01:07<00:05,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9501, UAS: 0.9622, LAS: 0.9298, UEM: 0.6596, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1177, partial_loss/deprel_loss: 0.2160, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3566, loss: 0.5175, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  95%|#########5| 106/111 [01:09<00:03,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9620, LAS: 0.9296, UEM: 0.6558, LEM: 0.4387, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2018, partial_loss/deprel_loss: 0.3323, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4664, loss: 0.5189, batch_reg_loss: 0.1603, reg_loss: 0.1604 ||:  99%|#########9| 110/111 [01:12<00:00,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9184, UAS: 0.9619, LAS: 0.9295, UEM: 0.6539, LEM: 0.4372, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5260, partial_loss/deprel_loss: 0.4188, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6005, loss: 0.5196, batch_reg_loss: 0.1602, reg_loss: 0.1604 ||: 100%|##########| 111/111 [01:13<00:00,  1.52it/s]\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.419  |       N/A\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.526  |       N/A\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.160  |       N/A\n",
      "2023-04-07 01:40:49,216 - INFO - combo.training.tensorboard_writer - UEM                      |     0.654  |       N/A\n",
      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - loss                     |     0.520  |       N/A\n",
      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - LEM                      |     0.437  |       N/A\n",
      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - EM                       |     0.918  |       N/A\n",
      "2023-04-07 01:40:49,217 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:40:49,222 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:40:54,297 - INFO - combo.training.trainer - Epoch duration: 0:01:21.425042\n",
      "2023-04-07 01:40:54,298 - INFO - combo.training.trainer - Estimated training time remaining: 6:16:27\n",
      "2023-04-07 01:40:54,298 - INFO - allennlp.training.trainer - Epoch 125/399\n",
      "2023-04-07 01:40:54,298 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:40:54,299 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:40:54,308 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9613, LAS: 0.9313, UEM: 0.6735, LEM: 0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5213, partial_loss/deprel_loss: 0.4072, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5903, loss: 0.4758, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:   3%|2         | 3/111 [00:02<01:25,  1.26it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9322, UAS: 0.9645, LAS: 0.9329, UEM: 0.6774, LEM: 0.4719, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3121, partial_loss/deprel_loss: 0.3536, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5055, loss: 0.4733, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:   5%|5         | 6/111 [00:04<01:24,  1.24it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9421, UAS: 0.9655, LAS: 0.9342, UEM: 0.6826, LEM: 0.4728, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1777, partial_loss/deprel_loss: 0.2511, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3966, loss: 0.4649, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:   8%|8         | 9/111 [00:07<01:23,  1.23it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9142, UAS: 0.9650, LAS: 0.9340, UEM: 0.6952, LEM: 0.5047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5937, partial_loss/deprel_loss: 0.4311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6239, loss: 0.4787, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  11%|#         | 12/111 [00:09<01:19,  1.25it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9649, LAS: 0.9337, UEM: 0.6848, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2166, partial_loss/deprel_loss: 0.3294, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4670, loss: 0.4813, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  14%|#4        | 16/111 [00:11<01:09,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9513, UAS: 0.9660, LAS: 0.9351, UEM: 0.7062, LEM: 0.5062, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1316, partial_loss/deprel_loss: 0.2023, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3484, loss: 0.4730, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  19%|#8        | 21/111 [00:14<00:59,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9748, UAS: 0.9654, LAS: 0.9346, UEM: 0.7213, LEM: 0.5392, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0280, partial_loss/deprel_loss: 0.0973, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2436, loss: 0.4750, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  23%|##3       | 26/111 [00:17<00:52,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9653, LAS: 0.9340, UEM: 0.7162, LEM: 0.5280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1675, partial_loss/deprel_loss: 0.2431, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3882, loss: 0.4790, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  28%|##7       | 31/111 [00:19<00:45,  1.75it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9649, LAS: 0.9334, UEM: 0.7044, LEM: 0.5135, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.2969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4407, loss: 0.4833, batch_reg_loss: 0.1602, reg_loss: 0.1602 ||:  32%|###1      | 35/111 [00:22<00:47,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9654, LAS: 0.9339, UEM: 0.7023, LEM: 0.5059, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3088, partial_loss/deprel_loss: 0.3605, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5103, loss: 0.4810, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  35%|###5      | 39/111 [00:25<00:47,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9652, UAS: 0.9658, LAS: 0.9344, UEM: 0.7101, LEM: 0.5151, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0582, partial_loss/deprel_loss: 0.1520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2933, loss: 0.4785, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  39%|###8      | 43/111 [00:28<00:47,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9472, UAS: 0.9658, LAS: 0.9344, UEM: 0.7116, LEM: 0.5160, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1175, partial_loss/deprel_loss: 0.2207, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3602, loss: 0.4784, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  41%|####1     | 46/111 [00:30<00:45,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9330, UAS: 0.9647, LAS: 0.9330, UEM: 0.7041, LEM: 0.5079, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3713, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5028, loss: 0.4888, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  44%|####4     | 49/111 [00:32<00:43,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9644, LAS: 0.9326, UEM: 0.7008, LEM: 0.5038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1494, partial_loss/deprel_loss: 0.2460, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3868, loss: 0.4925, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  47%|####6     | 52/111 [00:34<00:42,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9156, UAS: 0.9636, LAS: 0.9317, UEM: 0.6896, LEM: 0.4940, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5430, partial_loss/deprel_loss: 0.4607, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6372, loss: 0.4988, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  50%|####9     | 55/111 [00:37<00:40,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9318, UAS: 0.9632, LAS: 0.9313, UEM: 0.6814, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3158, partial_loss/deprel_loss: 0.4089, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5504, loss: 0.5032, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  52%|#####2    | 58/111 [00:39<00:38,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9521, UAS: 0.9635, LAS: 0.9314, UEM: 0.6849, LEM: 0.4860, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0668, partial_loss/deprel_loss: 0.2211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3503, loss: 0.5031, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  55%|#####4    | 61/111 [00:41<00:36,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9631, LAS: 0.9309, UEM: 0.6769, LEM: 0.4773, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2835, partial_loss/deprel_loss: 0.3242, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4761, loss: 0.5067, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  59%|#####8    | 65/111 [00:43<00:31,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9349, UAS: 0.9631, LAS: 0.9309, UEM: 0.6753, LEM: 0.4744, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2259, partial_loss/deprel_loss: 0.3241, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4645, loss: 0.5067, batch_reg_loss: 0.1601, reg_loss: 0.1602 ||:  62%|######2   | 69/111 [00:46<00:28,  1.48it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9258, UAS: 0.9633, LAS: 0.9310, UEM: 0.6719, LEM: 0.4695, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3911, partial_loss/deprel_loss: 0.3975, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5563, loss: 0.5057, batch_reg_loss: 0.1601, reg_loss: 0.1601 ||:  66%|######5   | 73/111 [00:48<00:24,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9633, LAS: 0.9308, UEM: 0.6678, LEM: 0.4625, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2641, partial_loss/deprel_loss: 0.3907, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5254, loss: 0.5079, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  69%|######9   | 77/111 [00:52<00:23,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9636, LAS: 0.9310, UEM: 0.6684, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3835, partial_loss/deprel_loss: 0.4084, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5635, loss: 0.5069, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  72%|#######2  | 80/111 [00:54<00:21,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9632, LAS: 0.9306, UEM: 0.6658, LEM: 0.4573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2415, partial_loss/deprel_loss: 0.2731, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4268, loss: 0.5088, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  75%|#######4  | 83/111 [00:56<00:19,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9625, LAS: 0.9298, UEM: 0.6636, LEM: 0.4546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1750, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4520, loss: 0.5155, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  77%|#######7  | 86/111 [00:58<00:17,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9195, UAS: 0.9619, LAS: 0.9293, UEM: 0.6578, LEM: 0.4483, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4905, partial_loss/deprel_loss: 0.4107, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5867, loss: 0.5193, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  81%|########1 | 90/111 [01:01<00:14,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9208, UAS: 0.9620, LAS: 0.9293, UEM: 0.6549, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3594, partial_loss/deprel_loss: 0.3532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5144, loss: 0.5188, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  85%|########4 | 94/111 [01:03<00:11,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9620, LAS: 0.9293, UEM: 0.6545, LEM: 0.4433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1414, partial_loss/deprel_loss: 0.2675, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4023, loss: 0.5179, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  88%|########8 | 98/111 [01:06<00:09,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9618, LAS: 0.9291, UEM: 0.6529, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1656, partial_loss/deprel_loss: 0.2876, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4232, loss: 0.5198, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  91%|######### | 101/111 [01:08<00:06,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9024, UAS: 0.9616, LAS: 0.9288, UEM: 0.6486, LEM: 0.4364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5981, partial_loss/deprel_loss: 0.4744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6592, loss: 0.5213, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  94%|#########3| 104/111 [01:10<00:04,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9617, LAS: 0.9288, UEM: 0.6468, LEM: 0.4344, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4200, partial_loss/deprel_loss: 0.3656, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5364, loss: 0.5212, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  96%|#########6| 107/111 [01:12<00:02,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9187, UAS: 0.9617, LAS: 0.9290, UEM: 0.6453, LEM: 0.4317, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4425, partial_loss/deprel_loss: 0.4211, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5854, loss: 0.5202, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||:  99%|#########9| 110/111 [01:15<00:00,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9619, LAS: 0.9291, UEM: 0.6506, LEM: 0.4377, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1172, partial_loss/deprel_loss: 0.2338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3705, loss: 0.5188, batch_reg_loss: 0.1600, reg_loss: 0.1601 ||: 100%|##########| 111/111 [01:16<00:00,  1.46it/s]\n",
      "2023-04-07 01:42:13,636 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9276, UAS: 0.9530, LAS: 0.9045, UEM: 0.6088, LEM: 0.3165, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3952, partial_loss/deprel_loss: 16.7865, partial_loss/cycle_loss: 0.0000, batch_loss: 13.5082, loss: 20.0456, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.05it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9492, LAS: 0.8996, UEM: 0.5886, LEM: 0.3032, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4041, partial_loss/deprel_loss: 25.1117, partial_loss/cycle_loss: 0.0000, batch_loss: 20.1702, loss: 22.7926, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.04it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9418, LAS: 0.8909, UEM: 0.5511, LEM: 0.2718, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3135, partial_loss/deprel_loss: 45.1808, partial_loss/cycle_loss: 0.0000, batch_loss: 36.4074, loss: 26.0686, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.08it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9479, LAS: 0.8988, UEM: 0.6540, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7454, partial_loss/deprel_loss: 28.2911, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7820, loss: 24.2716, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:10<00:00,  1.20it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8880, UAS: 0.9479, LAS: 0.8988, UEM: 0.6540, LEM: 0.4003, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7454, partial_loss/deprel_loss: 28.2911, partial_loss/cycle_loss: 0.0000, batch_loss: 22.7820, loss: 24.2716, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:10<00:00,  1.21it/s]\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - patience                 |     3.000  |       N/A\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.234  |    28.291\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.117  |     0.745\n",
      "2023-04-07 01:42:24,426 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.160  |     0.000\n",
      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - UEM                      |     0.651  |     0.654\n",
      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |     0.899\n",
      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - loss                     |     0.519  |    24.272\n",
      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - LEM                      |     0.438  |     0.400\n",
      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |     0.948\n",
      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - EM                       |     0.947  |     0.888\n",
      "2023-04-07 01:42:24,427 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:42:24,432 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:42:31,104 - INFO - combo.training.trainer - Epoch duration: 0:01:36.805760\n",
      "2023-04-07 01:42:31,104 - INFO - combo.training.trainer - Estimated training time remaining: 6:15:37\n",
      "2023-04-07 01:42:31,105 - INFO - allennlp.training.trainer - Epoch 126/399\n",
      "2023-04-07 01:42:31,105 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:42:31,106 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:42:31,115 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8970, UAS: 0.9523, LAS: 0.9153, UEM: 0.4448, LEM: 0.1759, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8348, partial_loss/deprel_loss: 0.5327, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7531, loss: 0.6257, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||:   3%|2         | 3/111 [00:02<01:16,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9519, LAS: 0.9174, UEM: 0.4296, LEM: 0.1925, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3077, partial_loss/deprel_loss: 0.3612, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5105, loss: 0.6160, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||:   5%|5         | 6/111 [00:04<01:16,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9510, UAS: 0.9612, LAS: 0.9279, UEM: 0.6479, LEM: 0.4082, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1347, partial_loss/deprel_loss: 0.2565, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3921, loss: 0.5449, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||:   8%|8         | 9/111 [00:06<01:17,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9316, UAS: 0.9587, LAS: 0.9255, UEM: 0.5725, LEM: 0.3480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3705, partial_loss/deprel_loss: 0.3808, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5387, loss: 0.5659, batch_reg_loss: 0.1600, reg_loss: 0.1600 ||:  12%|#1        | 13/111 [00:09<01:11,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9550, LAS: 0.9218, UEM: 0.5284, LEM: 0.3201, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3982, partial_loss/deprel_loss: 0.3401, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5117, loss: 0.5809, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||:  14%|#4        | 16/111 [00:11<01:08,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9485, UAS: 0.9576, LAS: 0.9248, UEM: 0.5812, LEM: 0.3710, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1394, partial_loss/deprel_loss: 0.1916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3411, loss: 0.5551, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||:  17%|#7        | 19/111 [00:13<01:07,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9102, UAS: 0.9591, LAS: 0.9260, UEM: 0.6086, LEM: 0.3964, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5340, partial_loss/deprel_loss: 0.4585, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6335, loss: 0.5456, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||:  20%|#9        | 22/111 [00:16<01:04,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9595, LAS: 0.9265, UEM: 0.6058, LEM: 0.3898, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2019, partial_loss/deprel_loss: 0.2954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4366, loss: 0.5419, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||:  23%|##2       | 25/111 [00:18<01:02,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9592, LAS: 0.9265, UEM: 0.5935, LEM: 0.3796, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2432, partial_loss/deprel_loss: 0.3101, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4567, loss: 0.5441, batch_reg_loss: 0.1599, reg_loss: 0.1600 ||:  25%|##5       | 28/111 [00:20<01:00,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9607, LAS: 0.9278, UEM: 0.6173, LEM: 0.3985, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0671, partial_loss/deprel_loss: 0.2273, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3552, loss: 0.5343, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  29%|##8       | 32/111 [00:23<00:56,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9744, UAS: 0.9618, LAS: 0.9291, UEM: 0.6616, LEM: 0.4600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0308, partial_loss/deprel_loss: 0.1074, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2519, loss: 0.5274, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  32%|###1      | 35/111 [00:25<00:57,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9629, LAS: 0.9300, UEM: 0.6791, LEM: 0.4738, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1931, partial_loss/deprel_loss: 0.2645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4101, loss: 0.5188, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  34%|###4      | 38/111 [00:28<00:55,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9293, UAS: 0.9631, LAS: 0.9299, UEM: 0.6741, LEM: 0.4640, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3212, partial_loss/deprel_loss: 0.3834, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5308, loss: 0.5209, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  37%|###6      | 41/111 [00:30<00:53,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9458, UAS: 0.9636, LAS: 0.9306, UEM: 0.6738, LEM: 0.4614, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1649, partial_loss/deprel_loss: 0.2527, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3950, loss: 0.5159, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  40%|###9      | 44/111 [00:32<00:49,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8795, UAS: 0.9616, LAS: 0.9286, UEM: 0.6619, LEM: 0.4516, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1917, partial_loss/deprel_loss: 0.6342, partial_loss/cycle_loss: 0.0000, batch_loss: 0.9055, loss: 0.5302, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  42%|####2     | 47/111 [00:34<00:46,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9264, UAS: 0.9616, LAS: 0.9287, UEM: 0.6567, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3388, partial_loss/deprel_loss: 0.3337, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4945, loss: 0.5289, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  45%|####5     | 50/111 [00:36<00:43,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9174, UAS: 0.9619, LAS: 0.9291, UEM: 0.6671, LEM: 0.4614, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4964, partial_loss/deprel_loss: 0.3825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5651, loss: 0.5256, batch_reg_loss: 0.1599, reg_loss: 0.1599 ||:  48%|####7     | 53/111 [00:38<00:41,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9622, LAS: 0.9292, UEM: 0.6709, LEM: 0.4650, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3431, partial_loss/deprel_loss: 0.4040, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5517, loss: 0.5249, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  51%|#####1    | 57/111 [00:41<00:37,  1.44it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9502, UAS: 0.9625, LAS: 0.9295, UEM: 0.6701, LEM: 0.4623, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1366, partial_loss/deprel_loss: 0.2424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3811, loss: 0.5231, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  55%|#####4    | 61/111 [00:43<00:32,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9627, LAS: 0.9295, UEM: 0.6651, LEM: 0.4552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2284, partial_loss/deprel_loss: 0.3486, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4844, loss: 0.5233, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  59%|#####8    | 65/111 [00:46<00:30,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9307, UAS: 0.9625, LAS: 0.9294, UEM: 0.6603, LEM: 0.4487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2891, partial_loss/deprel_loss: 0.3650, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5096, loss: 0.5236, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  62%|######2   | 69/111 [00:49<00:28,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9370, UAS: 0.9630, LAS: 0.9299, UEM: 0.6681, LEM: 0.4553, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2423, partial_loss/deprel_loss: 0.3194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4638, loss: 0.5196, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  65%|######4   | 72/111 [00:51<00:27,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9628, LAS: 0.9297, UEM: 0.6628, LEM: 0.4496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5273, partial_loss/deprel_loss: 0.4679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6396, loss: 0.5218, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  68%|######7   | 75/111 [00:54<00:27,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9489, UAS: 0.9633, LAS: 0.9302, UEM: 0.6708, LEM: 0.4573, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1428, partial_loss/deprel_loss: 0.2046, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3520, loss: 0.5175, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  71%|#######1  | 79/111 [00:56<00:23,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9638, LAS: 0.9310, UEM: 0.6793, LEM: 0.4667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0782, partial_loss/deprel_loss: 0.1631, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3059, loss: 0.5128, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  75%|#######4  | 83/111 [00:59<00:20,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9636, LAS: 0.9306, UEM: 0.6747, LEM: 0.4620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1512, partial_loss/deprel_loss: 0.2864, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4191, loss: 0.5153, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  78%|#######8  | 87/111 [01:02<00:16,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9326, UAS: 0.9633, LAS: 0.9305, UEM: 0.6681, LEM: 0.4555, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2875, partial_loss/deprel_loss: 0.3476, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4953, loss: 0.5166, batch_reg_loss: 0.1598, reg_loss: 0.1599 ||:  82%|########1 | 91/111 [01:04<00:12,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9631, LAS: 0.9301, UEM: 0.6639, LEM: 0.4504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1869, partial_loss/deprel_loss: 0.2987, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4361, loss: 0.5193, batch_reg_loss: 0.1597, reg_loss: 0.1599 ||:  86%|########5 | 95/111 [01:06<00:10,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9625, LAS: 0.9295, UEM: 0.6547, LEM: 0.4417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3615, partial_loss/deprel_loss: 0.4692, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6074, loss: 0.5237, batch_reg_loss: 0.1597, reg_loss: 0.1599 ||:  90%|######### | 100/111 [01:09<00:06,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9627, LAS: 0.9297, UEM: 0.6560, LEM: 0.4417, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2675, partial_loss/deprel_loss: 0.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4424, loss: 0.5225, batch_reg_loss: 0.1597, reg_loss: 0.1599 ||:  94%|#########3| 104/111 [01:11<00:03,  1.75it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9630, LAS: 0.9299, UEM: 0.6602, LEM: 0.4442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3212, partial_loss/deprel_loss: 0.3380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4944, loss: 0.5203, batch_reg_loss: 0.1597, reg_loss: 0.1598 ||:  97%|#########7| 108/111 [01:13<00:01,  1.68it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9630, LAS: 0.9301, UEM: 0.6596, LEM: 0.4437, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1864, partial_loss/deprel_loss: 0.2761, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4179, loss: 0.5199, batch_reg_loss: 0.1597, reg_loss: 0.1598 ||: 100%|##########| 111/111 [01:15<00:00,  1.46it/s]\n",
      "2023-04-07 01:43:50,185 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.276  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.186  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.160  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - UEM                      |     0.660  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - LAS                      |     0.930  |       N/A\n",
      "2023-04-07 01:43:50,186 - INFO - combo.training.tensorboard_writer - loss                     |     0.520  |       N/A\n",
      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - LEM                      |     0.444  |       N/A\n",
      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - EM                       |     0.943  |       N/A\n",
      "2023-04-07 01:43:50,187 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:43:50,192 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:44:00,241 - INFO - combo.training.trainer - Epoch duration: 0:01:29.136743\n",
      "2023-04-07 01:44:00,242 - INFO - combo.training.trainer - Estimated training time remaining: 6:14:29\n",
      "2023-04-07 01:44:00,242 - INFO - allennlp.training.trainer - Epoch 127/399\n",
      "2023-04-07 01:44:00,242 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:44:00,243 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:44:00,251 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9285, UAS: 0.9666, LAS: 0.9335, UEM: 0.6822, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4385, partial_loss/deprel_loss: 0.3819, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5529, loss: 0.4783, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:   3%|2         | 3/111 [00:02<01:17,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9445, UAS: 0.9638, LAS: 0.9309, UEM: 0.6726, LEM: 0.4667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1425, partial_loss/deprel_loss: 0.2496, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3879, loss: 0.5058, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:   5%|5         | 6/111 [00:04<01:16,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9277, UAS: 0.9619, LAS: 0.9283, UEM: 0.5965, LEM: 0.3874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2555, partial_loss/deprel_loss: 0.3948, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5267, loss: 0.5256, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:   9%|9         | 10/111 [00:06<01:10,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9636, LAS: 0.9300, UEM: 0.6324, LEM: 0.4101, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4912, partial_loss/deprel_loss: 0.4681, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6324, loss: 0.5159, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:  12%|#1        | 13/111 [00:09<01:11,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9109, UAS: 0.9637, LAS: 0.9308, UEM: 0.6668, LEM: 0.4577, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6734, partial_loss/deprel_loss: 0.4497, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6541, loss: 0.5116, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:  14%|#4        | 16/111 [00:11<01:10,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9514, UAS: 0.9639, LAS: 0.9320, UEM: 0.6639, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2104, partial_loss/deprel_loss: 0.2366, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3910, loss: 0.5048, batch_reg_loss: 0.1597, reg_loss: 0.1597 ||:  18%|#8        | 20/111 [00:14<01:05,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9408, UAS: 0.9655, LAS: 0.9335, UEM: 0.6962, LEM: 0.4888, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1528, partial_loss/deprel_loss: 0.2687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4052, loss: 0.4916, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  21%|##        | 23/111 [00:16<01:03,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9310, UAS: 0.9646, LAS: 0.9324, UEM: 0.6944, LEM: 0.4846, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3410, partial_loss/deprel_loss: 0.3548, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5116, loss: 0.4969, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  23%|##3       | 26/111 [00:18<01:00,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9652, LAS: 0.9334, UEM: 0.7096, LEM: 0.5095, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2559, partial_loss/deprel_loss: 0.3340, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4780, loss: 0.4899, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  26%|##6       | 29/111 [00:20<00:58,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9217, UAS: 0.9649, LAS: 0.9331, UEM: 0.7063, LEM: 0.5084, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5047, partial_loss/deprel_loss: 0.4043, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5840, loss: 0.4897, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  29%|##8       | 32/111 [00:22<00:55,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9226, UAS: 0.9646, LAS: 0.9326, UEM: 0.7006, LEM: 0.5012, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4657, partial_loss/deprel_loss: 0.4395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6044, loss: 0.4926, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  32%|###1      | 35/111 [00:25<00:54,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9638, LAS: 0.9318, UEM: 0.6895, LEM: 0.4905, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4964, partial_loss/deprel_loss: 0.4363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6079, loss: 0.4988, batch_reg_loss: 0.1596, reg_loss: 0.1597 ||:  34%|###4      | 38/111 [00:27<00:52,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9643, LAS: 0.9322, UEM: 0.6923, LEM: 0.4881, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1772, partial_loss/deprel_loss: 0.2341, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3823, loss: 0.4965, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||:  37%|###6      | 41/111 [00:29<00:49,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9650, LAS: 0.9329, UEM: 0.6934, LEM: 0.4853, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3462, partial_loss/deprel_loss: 0.3507, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5094, loss: 0.4947, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||:  41%|####      | 45/111 [00:31<00:45,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9247, UAS: 0.9646, LAS: 0.9323, UEM: 0.6840, LEM: 0.4736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3669, partial_loss/deprel_loss: 0.4550, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5969, loss: 0.4992, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||:  43%|####3     | 48/111 [00:34<00:44,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9263, UAS: 0.9646, LAS: 0.9325, UEM: 0.6855, LEM: 0.4765, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5006, partial_loss/deprel_loss: 0.3715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5569, loss: 0.4968, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||:  46%|####5     | 51/111 [00:36<00:42,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9466, UAS: 0.9644, LAS: 0.9320, UEM: 0.6830, LEM: 0.4708, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1502, partial_loss/deprel_loss: 0.2345, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3772, loss: 0.5002, batch_reg_loss: 0.1596, reg_loss: 0.1596 ||:  50%|####9     | 55/111 [00:38<00:37,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9305, UAS: 0.9638, LAS: 0.9313, UEM: 0.6721, LEM: 0.4593, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2561, partial_loss/deprel_loss: 0.3670, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5043, loss: 0.5036, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  53%|#####3    | 59/111 [00:41<00:34,  1.52it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9442, UAS: 0.9633, LAS: 0.9308, UEM: 0.6646, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2075, partial_loss/deprel_loss: 0.2798, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4249, loss: 0.5076, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  57%|#####6    | 63/111 [00:43<00:31,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9526, UAS: 0.9636, LAS: 0.9312, UEM: 0.6650, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1355, partial_loss/deprel_loss: 0.2434, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3814, loss: 0.5041, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  60%|######    | 67/111 [00:46<00:28,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9367, UAS: 0.9630, LAS: 0.9306, UEM: 0.6607, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2619, partial_loss/deprel_loss: 0.3262, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4728, loss: 0.5077, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  64%|######3   | 71/111 [00:48<00:25,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8759, UAS: 0.9626, LAS: 0.9302, UEM: 0.6624, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.1859, partial_loss/deprel_loss: 0.6156, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8891, loss: 0.5098, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  68%|######7   | 75/111 [00:51<00:24,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9623, LAS: 0.9297, UEM: 0.6539, LEM: 0.4374, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4116, partial_loss/deprel_loss: 0.3849, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5497, loss: 0.5136, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  71%|#######1  | 79/111 [00:53<00:20,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9441, UAS: 0.9624, LAS: 0.9298, UEM: 0.6510, LEM: 0.4334, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2462, partial_loss/deprel_loss: 0.2908, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4414, loss: 0.5126, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  75%|#######4  | 83/111 [00:56<00:18,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9621, LAS: 0.9296, UEM: 0.6472, LEM: 0.4299, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1450, partial_loss/deprel_loss: 0.2571, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3941, loss: 0.5159, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  78%|#######8  | 87/111 [00:59<00:16,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9028, UAS: 0.9611, LAS: 0.9285, UEM: 0.6402, LEM: 0.4247, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6970, partial_loss/deprel_loss: 0.5140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7101, loss: 0.5234, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  81%|########1 | 90/111 [01:01<00:14,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9616, LAS: 0.9290, UEM: 0.6462, LEM: 0.4303, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2819, partial_loss/deprel_loss: 0.3448, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4917, loss: 0.5197, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  85%|########4 | 94/111 [01:04<00:11,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9612, LAS: 0.9286, UEM: 0.6422, LEM: 0.4280, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1579, partial_loss/deprel_loss: 0.2391, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3823, loss: 0.5220, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  88%|########8 | 98/111 [01:06<00:08,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9374, UAS: 0.9614, LAS: 0.9288, UEM: 0.6433, LEM: 0.4273, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2286, partial_loss/deprel_loss: 0.3183, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4598, loss: 0.5200, batch_reg_loss: 0.1595, reg_loss: 0.1596 ||:  93%|#########2| 103/111 [01:08<00:04,  1.68it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9692, UAS: 0.9617, LAS: 0.9292, UEM: 0.6548, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0445, partial_loss/deprel_loss: 0.1054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2527, loss: 0.5181, batch_reg_loss: 0.1594, reg_loss: 0.1596 ||:  97%|#########7| 108/111 [01:11<00:01,  1.73it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9619, LAS: 0.9293, UEM: 0.6544, LEM: 0.4415, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1877, partial_loss/deprel_loss: 0.2913, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4300, loss: 0.5172, batch_reg_loss: 0.1594, reg_loss: 0.1596 ||: 100%|##########| 111/111 [01:12<00:00,  1.52it/s]\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.291  |       N/A\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.188  |       N/A\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.160  |       N/A\n",
      "2023-04-07 01:45:16,359 - INFO - combo.training.tensorboard_writer - UEM                      |     0.654  |       N/A\n",
      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - LAS                      |     0.929  |       N/A\n",
      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - loss                     |     0.517  |       N/A\n",
      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - LEM                      |     0.441  |       N/A\n",
      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - EM                       |     0.946  |       N/A\n",
      "2023-04-07 01:45:16,360 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:45:16,364 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:45:21,256 - INFO - combo.training.trainer - Epoch duration: 0:01:21.013571\n",
      "2023-04-07 01:45:21,256 - INFO - combo.training.trainer - Estimated training time remaining: 6:13:04\n",
      "2023-04-07 01:45:21,257 - INFO - allennlp.training.trainer - Epoch 128/399\n",
      "2023-04-07 01:45:21,257 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:45:21,258 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:45:21,267 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9033, UAS: 0.9686, LAS: 0.9401, UEM: 0.8848, LEM: 0.7510, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7817, partial_loss/deprel_loss: 0.4661, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6887, loss: 0.4405, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:   3%|2         | 3/111 [00:02<01:29,  1.21it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9469, UAS: 0.9672, LAS: 0.9368, UEM: 0.8125, LEM: 0.6448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1316, partial_loss/deprel_loss: 0.2365, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3749, loss: 0.4518, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:   5%|5         | 6/111 [00:04<01:22,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9654, LAS: 0.9340, UEM: 0.7629, LEM: 0.5667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3529, partial_loss/deprel_loss: 0.3521, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5117, loss: 0.4713, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:   9%|9         | 10/111 [00:07<01:14,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9637, LAS: 0.9319, UEM: 0.7178, LEM: 0.5154, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3760, partial_loss/deprel_loss: 0.3832, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5412, loss: 0.4924, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  12%|#1        | 13/111 [00:09<01:10,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9636, LAS: 0.9311, UEM: 0.6900, LEM: 0.4815, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3804, partial_loss/deprel_loss: 0.4062, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5605, loss: 0.5032, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  14%|#4        | 16/111 [00:11<01:07,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9628, LAS: 0.9302, UEM: 0.6866, LEM: 0.4737, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2117, partial_loss/deprel_loss: 0.3412, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4747, loss: 0.5149, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  17%|#7        | 19/111 [00:13<01:04,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9633, LAS: 0.9300, UEM: 0.6896, LEM: 0.4680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3266, partial_loss/deprel_loss: 0.3767, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5260, loss: 0.5101, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  20%|#9        | 22/111 [00:15<01:02,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9712, UAS: 0.9636, LAS: 0.9310, UEM: 0.7128, LEM: 0.5145, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0364, partial_loss/deprel_loss: 0.1140, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2578, loss: 0.5061, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  23%|##3       | 26/111 [00:18<01:01,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9292, UAS: 0.9634, LAS: 0.9309, UEM: 0.6973, LEM: 0.4973, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3625, partial_loss/deprel_loss: 0.3910, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5447, loss: 0.5099, batch_reg_loss: 0.1594, reg_loss: 0.1594 ||:  26%|##6       | 29/111 [00:20<01:00,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9117, UAS: 0.9631, LAS: 0.9306, UEM: 0.6848, LEM: 0.4836, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6988, partial_loss/deprel_loss: 0.4732, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6777, loss: 0.5138, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  29%|##8       | 32/111 [00:22<00:57,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9393, UAS: 0.9634, LAS: 0.9310, UEM: 0.6844, LEM: 0.4811, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1891, partial_loss/deprel_loss: 0.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4400, loss: 0.5123, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  32%|###1      | 35/111 [00:24<00:54,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9637, LAS: 0.9314, UEM: 0.6839, LEM: 0.4814, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3352, partial_loss/deprel_loss: 0.4113, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5554, loss: 0.5115, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  35%|###5      | 39/111 [00:27<00:49,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9635, LAS: 0.9312, UEM: 0.6794, LEM: 0.4762, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1725, partial_loss/deprel_loss: 0.3144, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4454, loss: 0.5129, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  38%|###7      | 42/111 [00:29<00:49,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9314, UAS: 0.9634, LAS: 0.9313, UEM: 0.6717, LEM: 0.4660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2903, partial_loss/deprel_loss: 0.3103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4656, loss: 0.5106, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  41%|####1     | 46/111 [00:32<00:44,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9631, LAS: 0.9309, UEM: 0.6701, LEM: 0.4657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3267, partial_loss/deprel_loss: 0.3545, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5083, loss: 0.5113, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  44%|####4     | 49/111 [00:34<00:43,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9639, LAS: 0.9318, UEM: 0.6815, LEM: 0.4748, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1246, partial_loss/deprel_loss: 0.2929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4186, loss: 0.5053, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  47%|####6     | 52/111 [00:36<00:41,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9647, LAS: 0.9326, UEM: 0.6911, LEM: 0.4791, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2317, partial_loss/deprel_loss: 0.3164, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4588, loss: 0.4997, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  50%|#####     | 56/111 [00:39<00:38,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9196, UAS: 0.9643, LAS: 0.9323, UEM: 0.6836, LEM: 0.4717, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5482, partial_loss/deprel_loss: 0.4451, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6250, loss: 0.5023, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  53%|#####3    | 59/111 [00:41<00:36,  1.44it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9643, LAS: 0.9320, UEM: 0.6791, LEM: 0.4649, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3415, partial_loss/deprel_loss: 0.4532, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5901, loss: 0.5038, batch_reg_loss: 0.1593, reg_loss: 0.1594 ||:  56%|#####5    | 62/111 [00:43<00:34,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9440, UAS: 0.9637, LAS: 0.9313, UEM: 0.6766, LEM: 0.4639, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1466, partial_loss/deprel_loss: 0.2395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3802, loss: 0.5083, batch_reg_loss: 0.1593, reg_loss: 0.1593 ||:  59%|#####8    | 65/111 [00:45<00:32,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9634, LAS: 0.9310, UEM: 0.6691, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5409, partial_loss/deprel_loss: 0.4361, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6163, loss: 0.5110, batch_reg_loss: 0.1593, reg_loss: 0.1593 ||:  61%|######1   | 68/111 [00:47<00:30,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9635, LAS: 0.9313, UEM: 0.6709, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3952, partial_loss/deprel_loss: 0.3686, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5331, loss: 0.5081, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  64%|######3   | 71/111 [00:49<00:28,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9629, LAS: 0.9306, UEM: 0.6680, LEM: 0.4550, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1545, partial_loss/deprel_loss: 0.2424, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3841, loss: 0.5118, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  68%|######7   | 75/111 [00:52<00:24,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9399, UAS: 0.9630, LAS: 0.9309, UEM: 0.6637, LEM: 0.4490, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2650, partial_loss/deprel_loss: 0.3520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4938, loss: 0.5100, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  71%|#######1  | 79/111 [00:54<00:20,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9333, UAS: 0.9628, LAS: 0.9307, UEM: 0.6595, LEM: 0.4460, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2778, partial_loss/deprel_loss: 0.3128, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4650, loss: 0.5112, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  76%|#######5  | 84/111 [00:56<00:15,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9197, UAS: 0.9622, LAS: 0.9302, UEM: 0.6550, LEM: 0.4419, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4723, partial_loss/deprel_loss: 0.4125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5837, loss: 0.5147, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  79%|#######9  | 88/111 [00:59<00:13,  1.71it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9390, UAS: 0.9624, LAS: 0.9305, UEM: 0.6550, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.2957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4638, loss: 0.5130, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  84%|########3 | 93/111 [01:01<00:09,  1.85it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9624, LAS: 0.9306, UEM: 0.6547, LEM: 0.4426, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4645, partial_loss/deprel_loss: 0.3790, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5553, loss: 0.5128, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  87%|########7 | 97/111 [01:03<00:07,  1.76it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9192, UAS: 0.9625, LAS: 0.9306, UEM: 0.6569, LEM: 0.4456, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5331, partial_loss/deprel_loss: 0.3988, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5848, loss: 0.5122, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  91%|######### | 101/111 [01:06<00:06,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9622, LAS: 0.9302, UEM: 0.6549, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1454, partial_loss/deprel_loss: 0.2793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4117, loss: 0.5142, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  95%|#########4| 105/111 [01:09<00:03,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9422, UAS: 0.9624, LAS: 0.9303, UEM: 0.6560, LEM: 0.4425, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1664, partial_loss/deprel_loss: 0.2886, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4233, loss: 0.5129, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||:  98%|#########8| 109/111 [01:12<00:01,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9176, UAS: 0.9622, LAS: 0.9302, UEM: 0.6526, LEM: 0.4394, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5603, partial_loss/deprel_loss: 0.4172, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6050, loss: 0.5139, batch_reg_loss: 0.1592, reg_loss: 0.1593 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
      "2023-04-07 01:46:37,762 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.417  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.560  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.159  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - UEM                      |     0.653  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - LAS                      |     0.930  |       N/A\n",
      "2023-04-07 01:46:37,763 - INFO - combo.training.tensorboard_writer - loss                     |     0.514  |       N/A\n",
      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - LEM                      |     0.439  |       N/A\n",
      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - UAS                      |     0.962  |       N/A\n",
      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - EM                       |     0.918  |       N/A\n",
      "2023-04-07 01:46:37,764 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:46:37,768 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:46:41,880 - INFO - combo.training.trainer - Epoch duration: 0:01:20.623541\n",
      "2023-04-07 01:46:41,881 - INFO - combo.training.trainer - Estimated training time remaining: 6:11:38\n",
      "2023-04-07 01:46:41,881 - INFO - allennlp.training.trainer - Epoch 129/399\n",
      "2023-04-07 01:46:41,881 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:46:41,882 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:46:41,889 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8972, UAS: 0.9571, LAS: 0.9253, UEM: 0.6291, LEM: 0.4178, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8287, partial_loss/deprel_loss: 0.4590, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6921, loss: 0.5324, batch_reg_loss: 0.1592, reg_loss: 0.1592 ||:   3%|2         | 3/111 [00:02<01:26,  1.25it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9592, LAS: 0.9265, UEM: 0.5725, LEM: 0.3463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4818, partial_loss/deprel_loss: 0.4078, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5818, loss: 0.5464, batch_reg_loss: 0.1591, reg_loss: 0.1592 ||:   5%|5         | 6/111 [00:04<01:20,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9294, UAS: 0.9626, LAS: 0.9302, UEM: 0.5930, LEM: 0.3601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3725, partial_loss/deprel_loss: 0.3704, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5299, loss: 0.5211, batch_reg_loss: 0.1591, reg_loss: 0.1592 ||:   8%|8         | 9/111 [00:06<01:15,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9246, UAS: 0.9638, LAS: 0.9326, UEM: 0.6199, LEM: 0.3914, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4593, partial_loss/deprel_loss: 0.3696, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5467, loss: 0.5010, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  11%|#         | 12/111 [00:08<01:11,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9417, UAS: 0.9640, LAS: 0.9327, UEM: 0.6444, LEM: 0.4161, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1979, partial_loss/deprel_loss: 0.3103, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4470, loss: 0.4944, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  14%|#3        | 15/111 [00:10<01:09,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9640, LAS: 0.9322, UEM: 0.6360, LEM: 0.4038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2576, partial_loss/deprel_loss: 0.2993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4501, loss: 0.4992, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  16%|#6        | 18/111 [00:12<01:06,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9204, UAS: 0.9635, LAS: 0.9319, UEM: 0.6334, LEM: 0.4055, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5344, partial_loss/deprel_loss: 0.4422, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6198, loss: 0.5011, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  19%|#8        | 21/111 [00:15<01:07,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9634, LAS: 0.9314, UEM: 0.6320, LEM: 0.3991, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2485, partial_loss/deprel_loss: 0.3423, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4827, loss: 0.5029, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  22%|##1       | 24/111 [00:17<01:03,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9456, UAS: 0.9630, LAS: 0.9313, UEM: 0.6391, LEM: 0.4144, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1685, partial_loss/deprel_loss: 0.2535, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3956, loss: 0.5036, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  25%|##5       | 28/111 [00:19<00:57,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9584, UAS: 0.9631, LAS: 0.9318, UEM: 0.6667, LEM: 0.4546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0664, partial_loss/deprel_loss: 0.1603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3006, loss: 0.4998, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  28%|##7       | 31/111 [00:22<00:57,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9255, UAS: 0.9630, LAS: 0.9316, UEM: 0.6514, LEM: 0.4349, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5565, partial_loss/deprel_loss: 0.4437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6253, loss: 0.5023, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  32%|###1      | 35/111 [00:24<00:53,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9644, LAS: 0.9331, UEM: 0.6810, LEM: 0.4665, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1582, partial_loss/deprel_loss: 0.2944, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4262, loss: 0.4920, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  34%|###4      | 38/111 [00:27<00:52,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9537, UAS: 0.9647, LAS: 0.9334, UEM: 0.6813, LEM: 0.4670, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1636, partial_loss/deprel_loss: 0.1904, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3441, loss: 0.4904, batch_reg_loss: 0.1591, reg_loss: 0.1591 ||:  37%|###6      | 41/111 [00:29<00:50,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9418, UAS: 0.9655, LAS: 0.9341, UEM: 0.6899, LEM: 0.4729, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1564, partial_loss/deprel_loss: 0.2981, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4288, loss: 0.4847, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  40%|###9      | 44/111 [00:31<00:49,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9234, UAS: 0.9650, LAS: 0.9336, UEM: 0.6775, LEM: 0.4600, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3987, partial_loss/deprel_loss: 0.3938, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.4880, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  43%|####3     | 48/111 [00:34<00:43,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9524, UAS: 0.9650, LAS: 0.9337, UEM: 0.6821, LEM: 0.4667, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0927, partial_loss/deprel_loss: 0.2014, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3387, loss: 0.4874, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  46%|####5     | 51/111 [00:36<00:43,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9400, UAS: 0.9645, LAS: 0.9329, UEM: 0.6861, LEM: 0.4691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1431, partial_loss/deprel_loss: 0.2954, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4239, loss: 0.4911, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  49%|####8     | 54/111 [00:38<00:41,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9640, LAS: 0.9326, UEM: 0.6750, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4421, partial_loss/deprel_loss: 0.3833, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5540, loss: 0.4949, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  52%|#####2    | 58/111 [00:41<00:36,  1.44it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9638, LAS: 0.9325, UEM: 0.6746, LEM: 0.4601, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6530, partial_loss/deprel_loss: 0.3825, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5956, loss: 0.4935, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  56%|#####5    | 62/111 [00:43<00:32,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9447, UAS: 0.9637, LAS: 0.9322, UEM: 0.6696, LEM: 0.4541, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2146, partial_loss/deprel_loss: 0.2791, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4252, loss: 0.4968, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  59%|#####9    | 66/111 [00:45<00:28,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9640, LAS: 0.9326, UEM: 0.6803, LEM: 0.4734, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3815, partial_loss/deprel_loss: 0.4428, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5895, loss: 0.4949, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  63%|######3   | 70/111 [00:47<00:24,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9169, UAS: 0.9629, LAS: 0.9315, UEM: 0.6715, LEM: 0.4660, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6440, partial_loss/deprel_loss: 0.4679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6621, loss: 0.5023, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  67%|######6   | 74/111 [00:49<00:21,  1.75it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9433, UAS: 0.9632, LAS: 0.9317, UEM: 0.6740, LEM: 0.4683, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2068, partial_loss/deprel_loss: 0.2518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4017, loss: 0.5003, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  71%|#######1  | 79/111 [00:52<00:17,  1.86it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9632, LAS: 0.9317, UEM: 0.6723, LEM: 0.4657, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3288, partial_loss/deprel_loss: 0.3709, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5215, loss: 0.5008, batch_reg_loss: 0.1590, reg_loss: 0.1591 ||:  75%|#######4  | 83/111 [00:54<00:15,  1.82it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9262, UAS: 0.9627, LAS: 0.9313, UEM: 0.6709, LEM: 0.4648, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3954, partial_loss/deprel_loss: 0.3580, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5244, loss: 0.5027, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  78%|#######8  | 87/111 [00:57<00:14,  1.65it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9632, LAS: 0.9318, UEM: 0.6740, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1702, partial_loss/deprel_loss: 0.2829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4193, loss: 0.5005, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  82%|########1 | 91/111 [01:00<00:12,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9632, LAS: 0.9318, UEM: 0.6711, LEM: 0.4630, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3401, partial_loss/deprel_loss: 0.3492, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5063, loss: 0.5009, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  86%|########5 | 95/111 [01:03<00:10,  1.53it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9354, UAS: 0.9633, LAS: 0.9318, UEM: 0.6691, LEM: 0.4596, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.3264, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4655, loss: 0.5007, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  89%|########9 | 99/111 [01:05<00:07,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8938, UAS: 0.9627, LAS: 0.9312, UEM: 0.6639, LEM: 0.4552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8737, partial_loss/deprel_loss: 0.5311, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7585, loss: 0.5051, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  93%|#########2| 103/111 [01:08<00:05,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9308, UAS: 0.9626, LAS: 0.9309, UEM: 0.6591, LEM: 0.4496, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2589, partial_loss/deprel_loss: 0.3584, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4974, loss: 0.5073, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||:  96%|#########6| 107/111 [01:11<00:02,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9626, LAS: 0.9310, UEM: 0.6551, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2786, partial_loss/deprel_loss: 0.3110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4634, loss: 0.5071, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 100%|##########| 111/111 [01:13<00:00,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9420, UAS: 0.9626, LAS: 0.9310, UEM: 0.6551, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2786, partial_loss/deprel_loss: 0.3110, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4634, loss: 0.5071, batch_reg_loss: 0.1589, reg_loss: 0.1590 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
      "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:47:59,072 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.311  |       N/A\n",
      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.279  |       N/A\n",
      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.159  |       N/A\n",
      "2023-04-07 01:47:59,073 - INFO - combo.training.tensorboard_writer - UEM                      |     0.655  |       N/A\n",
      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |       N/A\n",
      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - loss                     |     0.507  |       N/A\n",
      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - LEM                      |     0.445  |       N/A\n",
      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:47:59,074 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
      "2023-04-07 01:47:59,075 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:47:59,075 - INFO - combo.training.tensorboard_writer - EM                       |     0.942  |       N/A\n",
      "2023-04-07 01:47:59,075 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2023-04-07 01:47:59,081 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:48:06,063 - INFO - combo.training.trainer - Epoch duration: 0:01:24.181700\n",
      "2023-04-07 01:48:06,063 - INFO - combo.training.trainer - Estimated training time remaining: 6:10:20\n",
      "2023-04-07 01:48:06,063 - INFO - allennlp.training.trainer - Epoch 130/399\n",
      "2023-04-07 01:48:06,063 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:48:06,064 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:48:06,073 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9369, UAS: 0.9644, LAS: 0.9321, UEM: 0.6007, LEM: 0.3618, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2983, partial_loss/deprel_loss: 0.2848, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4464, loss: 0.5070, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||:   4%|3         | 4/111 [00:02<01:06,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9630, LAS: 0.9319, UEM: 0.5347, LEM: 0.2950, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2984, partial_loss/deprel_loss: 0.3859, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5272, loss: 0.5090, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||:   7%|7         | 8/111 [00:05<01:05,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9131, UAS: 0.9602, LAS: 0.9286, UEM: 0.5392, LEM: 0.3094, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5463, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6124, loss: 0.5236, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||:  11%|#         | 12/111 [00:07<01:00,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9450, UAS: 0.9631, LAS: 0.9321, UEM: 0.5913, LEM: 0.3613, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1982, partial_loss/deprel_loss: 0.2946, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4342, loss: 0.5061, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||:  14%|#3        | 15/111 [00:09<01:00,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9651, LAS: 0.9341, UEM: 0.6675, LEM: 0.4530, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1868, partial_loss/deprel_loss: 0.2916, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4295, loss: 0.4874, batch_reg_loss: 0.1589, reg_loss: 0.1589 ||:  16%|#6        | 18/111 [00:11<01:02,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9496, UAS: 0.9650, LAS: 0.9341, UEM: 0.6555, LEM: 0.4358, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1861, partial_loss/deprel_loss: 0.2947, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4318, loss: 0.4924, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||:  19%|#8        | 21/111 [00:13<01:01,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9653, LAS: 0.9344, UEM: 0.6473, LEM: 0.4239, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3484, partial_loss/deprel_loss: 0.3837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5355, loss: 0.4921, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||:  22%|##1       | 24/111 [00:15<00:59,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9186, UAS: 0.9638, LAS: 0.9329, UEM: 0.6244, LEM: 0.4037, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5195, partial_loss/deprel_loss: 0.4305, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6071, loss: 0.5015, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||:  25%|##5       | 28/111 [00:18<00:55,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9630, LAS: 0.9317, UEM: 0.6259, LEM: 0.4043, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9956, partial_loss/deprel_loss: 0.5592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8053, loss: 0.5075, batch_reg_loss: 0.1588, reg_loss: 0.1589 ||:  29%|##8       | 32/111 [00:21<00:52,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9632, LAS: 0.9318, UEM: 0.6266, LEM: 0.4038, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4981, partial_loss/deprel_loss: 0.4304, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6027, loss: 0.5074, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:  32%|###2      | 36/111 [00:23<00:48,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9090, UAS: 0.9640, LAS: 0.9322, UEM: 0.6423, LEM: 0.4150, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5620, partial_loss/deprel_loss: 0.4993, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6706, loss: 0.5044, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:  36%|###6      | 40/111 [00:26<00:46,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9436, UAS: 0.9647, LAS: 0.9332, UEM: 0.6779, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1671, partial_loss/deprel_loss: 0.2614, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4013, loss: 0.4988, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:  39%|###8      | 43/111 [00:29<00:50,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9657, LAS: 0.9343, UEM: 0.7038, LEM: 0.4956, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1492, partial_loss/deprel_loss: 0.2090, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3558, loss: 0.4886, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:  42%|####2     | 47/111 [00:31<00:44,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9126, UAS: 0.9643, LAS: 0.9328, UEM: 0.6897, LEM: 0.4799, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6428, partial_loss/deprel_loss: 0.4771, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6690, loss: 0.4994, batch_reg_loss: 0.1588, reg_loss: 0.1588 ||:  47%|####6     | 52/111 [00:34<00:37,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9641, LAS: 0.9324, UEM: 0.6784, LEM: 0.4671, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4256, partial_loss/deprel_loss: 0.3724, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5417, loss: 0.5004, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  51%|#####1    | 57/111 [00:36<00:31,  1.71it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9646, LAS: 0.9329, UEM: 0.6881, LEM: 0.4768, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1164, partial_loss/deprel_loss: 0.2322, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3677, loss: 0.4959, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  55%|#####4    | 61/111 [00:38<00:29,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9084, UAS: 0.9646, LAS: 0.9331, UEM: 0.6927, LEM: 0.4829, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7745, partial_loss/deprel_loss: 0.3842, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6210, loss: 0.4928, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  59%|#####8    | 65/111 [00:41<00:28,  1.60it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9164, UAS: 0.9634, LAS: 0.9317, UEM: 0.6818, LEM: 0.4728, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6007, partial_loss/deprel_loss: 0.4266, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6201, loss: 0.5024, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  62%|######2   | 69/111 [00:44<00:28,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9018, UAS: 0.9624, LAS: 0.9309, UEM: 0.6704, LEM: 0.4636, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7995, partial_loss/deprel_loss: 0.4756, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6991, loss: 0.5085, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  66%|######5   | 73/111 [00:47<00:26,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9094, UAS: 0.9618, LAS: 0.9302, UEM: 0.6615, LEM: 0.4558, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5721, partial_loss/deprel_loss: 0.4385, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6239, loss: 0.5133, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  68%|######8   | 76/111 [00:49<00:24,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9620, LAS: 0.9302, UEM: 0.6593, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1839, partial_loss/deprel_loss: 0.2956, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4320, loss: 0.5124, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  71%|#######1  | 79/111 [00:51<00:22,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9622, LAS: 0.9302, UEM: 0.6649, LEM: 0.4552, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0736, partial_loss/deprel_loss: 0.2425, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3674, loss: 0.5128, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  74%|#######3  | 82/111 [00:54<00:21,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9530, UAS: 0.9626, LAS: 0.9307, UEM: 0.6698, LEM: 0.4592, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1218, partial_loss/deprel_loss: 0.2427, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3772, loss: 0.5096, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  77%|#######6  | 85/111 [00:56<00:19,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9298, UAS: 0.9628, LAS: 0.9308, UEM: 0.6682, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3937, partial_loss/deprel_loss: 0.3968, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5549, loss: 0.5091, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  79%|#######9  | 88/111 [00:58<00:17,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9350, UAS: 0.9630, LAS: 0.9310, UEM: 0.6678, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2192, partial_loss/deprel_loss: 0.3421, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4762, loss: 0.5076, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  82%|########1 | 91/111 [01:00<00:14,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8878, UAS: 0.9628, LAS: 0.9308, UEM: 0.6676, LEM: 0.4532, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0291, partial_loss/deprel_loss: 0.5194, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7800, loss: 0.5087, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  85%|########4 | 94/111 [01:03<00:12,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9181, UAS: 0.9626, LAS: 0.9306, UEM: 0.6626, LEM: 0.4482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5218, partial_loss/deprel_loss: 0.4520, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6246, loss: 0.5101, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  87%|########7 | 97/111 [01:05<00:10,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9303, UAS: 0.9626, LAS: 0.9306, UEM: 0.6591, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3161, partial_loss/deprel_loss: 0.3380, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4923, loss: 0.5099, batch_reg_loss: 0.1587, reg_loss: 0.1588 ||:  91%|######### | 101/111 [01:08<00:07,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9092, UAS: 0.9627, LAS: 0.9307, UEM: 0.6601, LEM: 0.4457, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7448, partial_loss/deprel_loss: 0.5054, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7119, loss: 0.5095, batch_reg_loss: 0.1586, reg_loss: 0.1588 ||:  95%|#########4| 105/111 [01:10<00:04,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9627, LAS: 0.9308, UEM: 0.6589, LEM: 0.4450, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1161, partial_loss/deprel_loss: 0.2363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3709, loss: 0.5088, batch_reg_loss: 0.1586, reg_loss: 0.1588 ||:  98%|#########8| 109/111 [01:13<00:01,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9158, UAS: 0.9627, LAS: 0.9307, UEM: 0.6574, LEM: 0.4431, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6138, partial_loss/deprel_loss: 0.4042, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6048, loss: 0.5099, batch_reg_loss: 0.1586, reg_loss: 0.1588 ||: 100%|##########| 111/111 [01:14<00:00,  1.49it/s]\n",
      "2023-04-07 01:49:23,847 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9558, LAS: 0.9078, UEM: 0.7180, LEM: 0.4174, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4751, partial_loss/deprel_loss: 23.4358, partial_loss/cycle_loss: 0.0000, batch_loss: 18.8436, loss: 24.3775, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:08,  1.14it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8372, UAS: 0.9387, LAS: 0.8868, UEM: 0.5723, LEM: 0.3041, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.6799, partial_loss/deprel_loss: 53.1680, partial_loss/cycle_loss: 0.0000, batch_loss: 42.8704, loss: 28.7997, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.07it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9395, LAS: 0.8866, UEM: 0.5282, LEM: 0.2489, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7739, partial_loss/deprel_loss: 28.3741, partial_loss/cycle_loss: 0.0000, batch_loss: 22.8540, loss: 27.7545, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  69%|######9   | 9/13 [00:08<00:03,  1.07it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9477, UAS: 0.9457, LAS: 0.8958, UEM: 0.6517, LEM: 0.4020, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1904, partial_loss/deprel_loss: 17.1259, partial_loss/cycle_loss: 0.0000, batch_loss: 13.7388, loss: 25.1794, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9482, LAS: 0.8982, UEM: 0.6599, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5900, partial_loss/deprel_loss: 23.0872, partial_loss/cycle_loss: 0.0000, batch_loss: 18.5878, loss: 24.2782, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.00s/it]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9014, UAS: 0.9482, LAS: 0.8982, UEM: 0.6599, LEM: 0.3943, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5900, partial_loss/deprel_loss: 23.0872, partial_loss/cycle_loss: 0.0000, batch_loss: 18.5878, loss: 24.2782, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.01it/s]\n",
      "2023-04-07 01:49:36,765 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:49:36,765 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - patience                 |     2.000  |       N/A\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.404  |    23.087\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.614  |     0.590\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.159  |     0.000\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - UEM                      |     0.657  |     0.660\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |     0.898\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - loss                     |     0.510  |    24.278\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - LEM                      |     0.443  |     0.394\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:49:36,766 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |     0.948\n",
      "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - EM                       |     0.916  |     0.901\n",
      "2023-04-07 01:49:36,767 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:49:36,772 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:49:41,759 - INFO - combo.training.trainer - Epoch duration: 0:01:35.695957\n",
      "2023-04-07 01:49:41,760 - INFO - combo.training.trainer - Estimated training time remaining: 6:09:25\n",
      "2023-04-07 01:49:41,760 - INFO - allennlp.training.trainer - Epoch 131/399\n",
      "2023-04-07 01:49:41,760 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:49:41,761 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:49:41,771 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9404, UAS: 0.9658, LAS: 0.9335, UEM: 0.6562, LEM: 0.4297, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2158, partial_loss/deprel_loss: 0.3432, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4763, loss: 0.4845, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:   3%|2         | 3/111 [00:02<01:25,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9385, UAS: 0.9690, LAS: 0.9351, UEM: 0.6834, LEM: 0.4218, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2940, partial_loss/deprel_loss: 0.3080, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4639, loss: 0.4758, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:   5%|5         | 6/111 [00:04<01:19,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9650, LAS: 0.9318, UEM: 0.6375, LEM: 0.4047, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1942, partial_loss/deprel_loss: 0.2715, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4146, loss: 0.5000, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:   9%|9         | 10/111 [00:06<01:09,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9116, UAS: 0.9639, LAS: 0.9309, UEM: 0.6198, LEM: 0.3833, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4991, partial_loss/deprel_loss: 0.4957, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6550, loss: 0.5093, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  14%|#3        | 15/111 [00:09<01:00,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9096, UAS: 0.9632, LAS: 0.9305, UEM: 0.6157, LEM: 0.3840, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7437, partial_loss/deprel_loss: 0.4854, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6957, loss: 0.5132, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  17%|#7        | 19/111 [00:11<00:58,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9644, LAS: 0.9318, UEM: 0.6112, LEM: 0.3696, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3087, partial_loss/deprel_loss: 0.3383, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4910, loss: 0.5065, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  21%|##        | 23/111 [00:13<00:52,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9700, UAS: 0.9657, LAS: 0.9339, UEM: 0.6792, LEM: 0.4690, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0435, partial_loss/deprel_loss: 0.1104, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2556, loss: 0.4905, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  24%|##4       | 27/111 [00:16<00:52,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9643, LAS: 0.9328, UEM: 0.6564, LEM: 0.4454, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3674, partial_loss/deprel_loss: 0.3604, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5203, loss: 0.4984, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  28%|##7       | 31/111 [00:18<00:49,  1.63it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9282, UAS: 0.9642, LAS: 0.9326, UEM: 0.6407, LEM: 0.4252, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3813, partial_loss/deprel_loss: 0.3253, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4951, loss: 0.4981, batch_reg_loss: 0.1586, reg_loss: 0.1586 ||:  32%|###2      | 36/111 [00:20<00:42,  1.78it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9645, LAS: 0.9329, UEM: 0.6449, LEM: 0.4271, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4363, partial_loss/deprel_loss: 0.3574, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5318, loss: 0.4958, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  37%|###6      | 41/111 [00:23<00:37,  1.85it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9215, UAS: 0.9644, LAS: 0.9328, UEM: 0.6491, LEM: 0.4322, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4255, partial_loss/deprel_loss: 0.4384, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5944, loss: 0.4963, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  41%|####      | 45/111 [00:26<00:38,  1.70it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9642, LAS: 0.9327, UEM: 0.6549, LEM: 0.4391, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3966, partial_loss/deprel_loss: 0.3687, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5328, loss: 0.4974, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  44%|####4     | 49/111 [00:28<00:37,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9357, UAS: 0.9646, LAS: 0.9330, UEM: 0.6640, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2790, partial_loss/deprel_loss: 0.3283, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4769, loss: 0.4947, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  48%|####7     | 53/111 [00:31<00:37,  1.57it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9304, UAS: 0.9653, LAS: 0.9338, UEM: 0.6784, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2823, partial_loss/deprel_loss: 0.3371, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4846, loss: 0.4883, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  51%|#####1    | 57/111 [00:34<00:37,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9426, UAS: 0.9657, LAS: 0.9338, UEM: 0.6797, LEM: 0.4635, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1760, partial_loss/deprel_loss: 0.2770, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4153, loss: 0.4867, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  55%|#####4    | 61/111 [00:37<00:34,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9659, LAS: 0.9341, UEM: 0.6800, LEM: 0.4620, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2181, partial_loss/deprel_loss: 0.3302, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4663, loss: 0.4860, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  58%|#####7    | 64/111 [00:39<00:32,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9655, LAS: 0.9335, UEM: 0.6778, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1973, partial_loss/deprel_loss: 0.2701, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4140, loss: 0.4904, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  61%|######1   | 68/111 [00:42<00:29,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9100, UAS: 0.9646, LAS: 0.9325, UEM: 0.6730, LEM: 0.4548, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6611, partial_loss/deprel_loss: 0.4525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6527, loss: 0.4967, batch_reg_loss: 0.1585, reg_loss: 0.1586 ||:  64%|######3   | 71/111 [00:44<00:27,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9640, LAS: 0.9318, UEM: 0.6679, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4213, partial_loss/deprel_loss: 0.4116, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5720, loss: 0.5014, batch_reg_loss: 0.1585, reg_loss: 0.1585 ||:  68%|######7   | 75/111 [00:46<00:24,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9157, UAS: 0.9636, LAS: 0.9316, UEM: 0.6655, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5326, partial_loss/deprel_loss: 0.4338, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6120, loss: 0.5018, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  71%|#######1  | 79/111 [00:49<00:21,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9274, UAS: 0.9635, LAS: 0.9314, UEM: 0.6593, LEM: 0.4451, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4088, partial_loss/deprel_loss: 0.3212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4972, loss: 0.5036, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  74%|#######3  | 82/111 [00:51<00:19,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9638, LAS: 0.9319, UEM: 0.6595, LEM: 0.4433, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1496, partial_loss/deprel_loss: 0.2449, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3843, loss: 0.5006, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  77%|#######7  | 86/111 [00:54<00:16,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9055, UAS: 0.9638, LAS: 0.9319, UEM: 0.6648, LEM: 0.4531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6573, partial_loss/deprel_loss: 0.5130, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7003, loss: 0.5010, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  80%|########  | 89/111 [00:56<00:15,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9636, LAS: 0.9317, UEM: 0.6590, LEM: 0.4469, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4891, partial_loss/deprel_loss: 0.4768, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6377, loss: 0.5029, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  84%|########3 | 93/111 [00:59<00:11,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9497, UAS: 0.9635, LAS: 0.9316, UEM: 0.6583, LEM: 0.4467, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1251, partial_loss/deprel_loss: 0.2280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3658, loss: 0.5027, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  87%|########7 | 97/111 [01:02<00:09,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9636, LAS: 0.9318, UEM: 0.6572, LEM: 0.4449, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1973, partial_loss/deprel_loss: 0.2348, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3857, loss: 0.5018, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  90%|######### | 100/111 [01:04<00:07,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9313, UAS: 0.9639, LAS: 0.9319, UEM: 0.6622, LEM: 0.4478, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2035, partial_loss/deprel_loss: 0.3206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4556, loss: 0.5003, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  93%|#########2| 103/111 [01:06<00:05,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9097, UAS: 0.9637, LAS: 0.9318, UEM: 0.6594, LEM: 0.4448, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7736, partial_loss/deprel_loss: 0.4351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6612, loss: 0.5017, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  95%|#########5| 106/111 [01:08<00:03,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9633, LAS: 0.9314, UEM: 0.6576, LEM: 0.4430, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4196, partial_loss/deprel_loss: 0.3443, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5178, loss: 0.5043, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||:  98%|#########8| 109/111 [01:10<00:01,  1.41it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9162, UAS: 0.9633, LAS: 0.9314, UEM: 0.6589, LEM: 0.4443, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5801, partial_loss/deprel_loss: 0.4209, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6111, loss: 0.5043, batch_reg_loss: 0.1584, reg_loss: 0.1585 ||: 100%|##########| 111/111 [01:12<00:00,  1.53it/s]\n",
      "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:50:57,365 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.421  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.580  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.159  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - UEM                      |     0.659  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - loss                     |     0.504  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - LEM                      |     0.444  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:50:57,366 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
      "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - EM                       |     0.916  |       N/A\n",
      "2023-04-07 01:50:57,367 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:50:57,372 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:51:04,337 - INFO - combo.training.trainer - Epoch duration: 0:01:22.576860\n",
      "2023-04-07 01:51:04,337 - INFO - combo.training.trainer - Estimated training time remaining: 6:08:03\n",
      "2023-04-07 01:51:04,338 - INFO - allennlp.training.trainer - Epoch 132/399\n",
      "2023-04-07 01:51:04,338 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:51:04,339 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:51:04,348 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9239, UAS: 0.9355, LAS: 0.9035, UEM: 0.2982, LEM: 0.1404, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4192, partial_loss/deprel_loss: 0.4010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5630, loss: 0.6882, batch_reg_loss: 0.1584, reg_loss: 0.1584 ||:   3%|2         | 3/111 [00:02<01:25,  1.26it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9578, UAS: 0.9504, LAS: 0.9180, UEM: 0.5783, LEM: 0.3771, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1050, partial_loss/deprel_loss: 0.2255, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3598, loss: 0.5970, batch_reg_loss: 0.1584, reg_loss: 0.1584 ||:   6%|6         | 7/111 [00:04<01:14,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9253, UAS: 0.9573, LAS: 0.9259, UEM: 0.6287, LEM: 0.4337, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5310, partial_loss/deprel_loss: 0.3926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5786, loss: 0.5515, batch_reg_loss: 0.1584, reg_loss: 0.1584 ||:  11%|#         | 12/111 [00:06<01:04,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9336, UAS: 0.9604, LAS: 0.9291, UEM: 0.6289, LEM: 0.4149, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3882, partial_loss/deprel_loss: 0.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4788, loss: 0.5247, batch_reg_loss: 0.1583, reg_loss: 0.1584 ||:  15%|#5        | 17/111 [00:09<00:55,  1.69it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9363, UAS: 0.9596, LAS: 0.9288, UEM: 0.5911, LEM: 0.3805, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2431, partial_loss/deprel_loss: 0.2964, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4441, loss: 0.5271, batch_reg_loss: 0.1583, reg_loss: 0.1584 ||:  20%|#9        | 22/111 [00:11<00:49,  1.80it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9608, LAS: 0.9298, UEM: 0.6044, LEM: 0.3931, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1252, partial_loss/deprel_loss: 0.2280, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3657, loss: 0.5187, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  23%|##3       | 26/111 [00:14<00:49,  1.72it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9229, UAS: 0.9616, LAS: 0.9301, UEM: 0.6135, LEM: 0.3947, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4241, partial_loss/deprel_loss: 0.3883, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5538, loss: 0.5136, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  27%|##7       | 30/111 [00:16<00:48,  1.68it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9341, UAS: 0.9613, LAS: 0.9295, UEM: 0.5998, LEM: 0.3801, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2229, partial_loss/deprel_loss: 0.3298, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4667, loss: 0.5181, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  31%|###       | 34/111 [00:19<00:46,  1.67it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9604, UAS: 0.9620, LAS: 0.9306, UEM: 0.6366, LEM: 0.4269, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0532, partial_loss/deprel_loss: 0.1433, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2835, loss: 0.5104, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  34%|###4      | 38/111 [00:22<00:48,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9631, LAS: 0.9317, UEM: 0.6435, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.3114, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4472, loss: 0.5039, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  38%|###7      | 42/111 [00:24<00:43,  1.57it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9167, UAS: 0.9622, LAS: 0.9310, UEM: 0.6257, LEM: 0.4133, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6065, partial_loss/deprel_loss: 0.4111, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6085, loss: 0.5105, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  41%|####1     | 46/111 [00:27<00:41,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9235, UAS: 0.9623, LAS: 0.9310, UEM: 0.6233, LEM: 0.4077, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4085, partial_loss/deprel_loss: 0.4134, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5707, loss: 0.5106, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  45%|####5     | 50/111 [00:30<00:41,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9335, UAS: 0.9628, LAS: 0.9316, UEM: 0.6238, LEM: 0.4058, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2636, partial_loss/deprel_loss: 0.3504, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4913, loss: 0.5083, batch_reg_loss: 0.1583, reg_loss: 0.1583 ||:  49%|####8     | 54/111 [00:33<00:39,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9632, LAS: 0.9320, UEM: 0.6408, LEM: 0.4249, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3688, partial_loss/deprel_loss: 0.3437, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5070, loss: 0.5037, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  51%|#####1    | 57/111 [00:35<00:39,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9462, UAS: 0.9636, LAS: 0.9324, UEM: 0.6484, LEM: 0.4327, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1830, partial_loss/deprel_loss: 0.2714, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4120, loss: 0.5000, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  54%|#####4    | 60/111 [00:37<00:36,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9334, UAS: 0.9638, LAS: 0.9326, UEM: 0.6474, LEM: 0.4314, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2889, partial_loss/deprel_loss: 0.3331, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4825, loss: 0.4986, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  57%|#####6    | 63/111 [00:39<00:34,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8966, UAS: 0.9625, LAS: 0.9312, UEM: 0.6366, LEM: 0.4223, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9148, partial_loss/deprel_loss: 0.4920, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7348, loss: 0.5080, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  60%|######    | 67/111 [00:42<00:30,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9375, UAS: 0.9625, LAS: 0.9313, UEM: 0.6407, LEM: 0.4283, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3029, partial_loss/deprel_loss: 0.3052, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4629, loss: 0.5070, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  63%|######3   | 70/111 [00:44<00:28,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9121, UAS: 0.9623, LAS: 0.9311, UEM: 0.6390, LEM: 0.4277, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6995, partial_loss/deprel_loss: 0.4300, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6421, loss: 0.5082, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  66%|######5   | 73/111 [00:46<00:26,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9509, UAS: 0.9628, LAS: 0.9315, UEM: 0.6497, LEM: 0.4384, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0792, partial_loss/deprel_loss: 0.2490, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3733, loss: 0.5059, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  68%|######8   | 76/111 [00:49<00:26,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9437, UAS: 0.9626, LAS: 0.9311, UEM: 0.6497, LEM: 0.4388, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1317, partial_loss/deprel_loss: 0.2263, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3656, loss: 0.5085, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  71%|#######1  | 79/111 [00:51<00:23,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9218, UAS: 0.9628, LAS: 0.9313, UEM: 0.6545, LEM: 0.4447, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4289, partial_loss/deprel_loss: 0.4707, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6206, loss: 0.5078, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  75%|#######4  | 83/111 [00:53<00:19,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9324, UAS: 0.9630, LAS: 0.9315, UEM: 0.6547, LEM: 0.4427, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2771, partial_loss/deprel_loss: 0.3637, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5046, loss: 0.5069, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  77%|#######7  | 86/111 [00:55<00:17,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9396, UAS: 0.9633, LAS: 0.9316, UEM: 0.6556, LEM: 0.4405, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2261, partial_loss/deprel_loss: 0.3324, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4693, loss: 0.5058, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  80%|########  | 89/111 [00:57<00:15,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9353, UAS: 0.9631, LAS: 0.9313, UEM: 0.6521, LEM: 0.4364, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2621, partial_loss/deprel_loss: 0.2951, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4466, loss: 0.5071, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  83%|########2 | 92/111 [01:00<00:13,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9728, UAS: 0.9633, LAS: 0.9317, UEM: 0.6672, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0490, partial_loss/deprel_loss: 0.1049, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2518, loss: 0.5055, batch_reg_loss: 0.1582, reg_loss: 0.1583 ||:  86%|########5 | 95/111 [01:03<00:12,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9637, LAS: 0.9318, UEM: 0.6667, LEM: 0.4554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3139, partial_loss/deprel_loss: 0.3837, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5279, loss: 0.5045, batch_reg_loss: 0.1581, reg_loss: 0.1583 ||:  89%|########9 | 99/111 [01:05<00:08,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9452, UAS: 0.9638, LAS: 0.9319, UEM: 0.6678, LEM: 0.4559, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1525, partial_loss/deprel_loss: 0.2578, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3949, loss: 0.5033, batch_reg_loss: 0.1581, reg_loss: 0.1583 ||:  92%|#########1| 102/111 [01:07<00:06,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9173, UAS: 0.9633, LAS: 0.9314, UEM: 0.6613, LEM: 0.4506, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5248, partial_loss/deprel_loss: 0.4121, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5928, loss: 0.5068, batch_reg_loss: 0.1581, reg_loss: 0.1583 ||:  95%|#########4| 105/111 [01:09<00:04,  1.36it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9151, UAS: 0.9629, LAS: 0.9311, UEM: 0.6577, LEM: 0.4468, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4233, partial_loss/deprel_loss: 0.4399, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5947, loss: 0.5092, batch_reg_loss: 0.1581, reg_loss: 0.1582 ||:  97%|#########7| 108/111 [01:12<00:02,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9632, LAS: 0.9313, UEM: 0.6598, LEM: 0.4465, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1641, partial_loss/deprel_loss: 0.2865, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4201, loss: 0.5077, batch_reg_loss: 0.1581, reg_loss: 0.1582 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "2023-04-07 01:52:21,453 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.287  |       N/A\n",
      "2023-04-07 01:52:21,454 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.164  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.158  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - UEM                      |     0.660  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - loss                     |     0.508  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - LEM                      |     0.447  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - EM                       |     0.944  |       N/A\n",
      "2023-04-07 01:52:21,455 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:52:21,460 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:52:29,124 - INFO - combo.training.trainer - Epoch duration: 0:01:24.786423\n",
      "2023-04-07 01:52:29,125 - INFO - combo.training.trainer - Estimated training time remaining: 6:06:46\n",
      "2023-04-07 01:52:29,125 - INFO - allennlp.training.trainer - Epoch 133/399\n",
      "2023-04-07 01:52:29,125 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:52:29,126 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:52:29,137 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9376, UAS: 0.9731, LAS: 0.9427, UEM: 0.7832, LEM: 0.5870, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3008, partial_loss/deprel_loss: 0.2936, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4532, loss: 0.4103, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:   5%|4         | 5/111 [00:02<00:52,  2.00it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9325, UAS: 0.9658, LAS: 0.9356, UEM: 0.7113, LEM: 0.5108, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3312, partial_loss/deprel_loss: 0.3483, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5030, loss: 0.4581, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:   7%|7         | 8/111 [00:04<00:59,  1.74it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9656, LAS: 0.9347, UEM: 0.7061, LEM: 0.4976, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3322, partial_loss/deprel_loss: 0.3353, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4928, loss: 0.4600, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:  10%|9         | 11/111 [00:06<01:02,  1.61it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9091, UAS: 0.9632, LAS: 0.9318, UEM: 0.6725, LEM: 0.4664, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7018, partial_loss/deprel_loss: 0.4381, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6489, loss: 0.4809, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:  13%|#2        | 14/111 [00:08<01:02,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9634, LAS: 0.9313, UEM: 0.6568, LEM: 0.4424, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1925, partial_loss/deprel_loss: 0.3132, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4472, loss: 0.4887, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:  15%|#5        | 17/111 [00:11<01:02,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9329, UAS: 0.9628, LAS: 0.9303, UEM: 0.6486, LEM: 0.4315, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2312, partial_loss/deprel_loss: 0.2814, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4294, loss: 0.4948, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:  18%|#8        | 20/111 [00:13<01:03,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9039, UAS: 0.9638, LAS: 0.9312, UEM: 0.6779, LEM: 0.4617, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7755, partial_loss/deprel_loss: 0.4929, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7074, loss: 0.4923, batch_reg_loss: 0.1581, reg_loss: 0.1581 ||:  21%|##        | 23/111 [00:15<01:01,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9616, UAS: 0.9652, LAS: 0.9330, UEM: 0.7083, LEM: 0.4995, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0606, partial_loss/deprel_loss: 0.1413, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2832, loss: 0.4807, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  23%|##3       | 26/111 [00:18<01:02,  1.36it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9646, LAS: 0.9325, UEM: 0.7066, LEM: 0.5026, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4830, partial_loss/deprel_loss: 0.3893, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5661, loss: 0.4855, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  26%|##6       | 29/111 [00:20<00:59,  1.38it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8908, UAS: 0.9635, LAS: 0.9313, UEM: 0.6873, LEM: 0.4828, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8328, partial_loss/deprel_loss: 0.5691, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7799, loss: 0.4968, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  30%|##9       | 33/111 [00:22<00:54,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9328, UAS: 0.9639, LAS: 0.9316, UEM: 0.6871, LEM: 0.4818, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2880, partial_loss/deprel_loss: 0.3547, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4994, loss: 0.4923, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  32%|###2      | 36/111 [00:24<00:53,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9147, UAS: 0.9619, LAS: 0.9301, UEM: 0.6684, LEM: 0.4652, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6564, partial_loss/deprel_loss: 0.4076, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6154, loss: 0.5014, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  36%|###6      | 40/111 [00:27<00:48,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9191, UAS: 0.9617, LAS: 0.9298, UEM: 0.6542, LEM: 0.4504, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5085, partial_loss/deprel_loss: 0.4750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6397, loss: 0.5079, batch_reg_loss: 0.1580, reg_loss: 0.1581 ||:  40%|###9      | 44/111 [00:29<00:44,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9423, UAS: 0.9625, LAS: 0.9306, UEM: 0.6561, LEM: 0.4484, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2151, partial_loss/deprel_loss: 0.2727, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4192, loss: 0.5018, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  43%|####3     | 48/111 [00:32<00:40,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9398, UAS: 0.9626, LAS: 0.9304, UEM: 0.6582, LEM: 0.4461, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1578, partial_loss/deprel_loss: 0.2982, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4281, loss: 0.5035, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  47%|####6     | 52/111 [00:35<00:39,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9394, UAS: 0.9627, LAS: 0.9306, UEM: 0.6538, LEM: 0.4389, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2265, partial_loss/deprel_loss: 0.3118, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4527, loss: 0.5034, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  50%|#####     | 56/111 [00:38<00:38,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9321, UAS: 0.9630, LAS: 0.9310, UEM: 0.6533, LEM: 0.4381, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3521, partial_loss/deprel_loss: 0.3434, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5031, loss: 0.5006, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  53%|#####3    | 59/111 [00:40<00:35,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9302, UAS: 0.9634, LAS: 0.9315, UEM: 0.6593, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3861, partial_loss/deprel_loss: 0.3899, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5471, loss: 0.4973, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  56%|#####5    | 62/111 [00:42<00:34,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9154, UAS: 0.9632, LAS: 0.9313, UEM: 0.6543, LEM: 0.4386, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4943, partial_loss/deprel_loss: 0.4377, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6070, loss: 0.4994, batch_reg_loss: 0.1580, reg_loss: 0.1580 ||:  59%|#####8    | 65/111 [00:44<00:33,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9637, LAS: 0.9317, UEM: 0.6609, LEM: 0.4441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2084, partial_loss/deprel_loss: 0.2780, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4221, loss: 0.4958, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  61%|######1   | 68/111 [00:47<00:32,  1.31it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9776, UAS: 0.9645, LAS: 0.9327, UEM: 0.6818, LEM: 0.4724, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0263, partial_loss/deprel_loss: 0.0802, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2273, loss: 0.4900, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  65%|######4   | 72/111 [00:50<00:29,  1.33it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9231, UAS: 0.9648, LAS: 0.9329, UEM: 0.6870, LEM: 0.4766, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3513, partial_loss/deprel_loss: 0.4002, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5484, loss: 0.4877, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  68%|######7   | 75/111 [00:52<00:27,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9364, UAS: 0.9645, LAS: 0.9325, UEM: 0.6847, LEM: 0.4736, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2349, partial_loss/deprel_loss: 0.3626, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4950, loss: 0.4920, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  71%|#######1  | 79/111 [00:55<00:23,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9019, UAS: 0.9640, LAS: 0.9320, UEM: 0.6775, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7113, partial_loss/deprel_loss: 0.4739, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6793, loss: 0.4946, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  75%|#######4  | 83/111 [00:57<00:19,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9206, UAS: 0.9639, LAS: 0.9317, UEM: 0.6702, LEM: 0.4585, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4289, partial_loss/deprel_loss: 0.4559, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6084, loss: 0.4979, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  78%|#######8  | 87/111 [01:00<00:16,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9139, UAS: 0.9635, LAS: 0.9313, UEM: 0.6640, LEM: 0.4533, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5999, partial_loss/deprel_loss: 0.4465, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6351, loss: 0.5010, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  81%|########1 | 90/111 [01:02<00:14,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9118, UAS: 0.9631, LAS: 0.9310, UEM: 0.6608, LEM: 0.4497, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6336, partial_loss/deprel_loss: 0.5125, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6946, loss: 0.5039, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  85%|########4 | 94/111 [01:04<00:11,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9257, UAS: 0.9634, LAS: 0.9313, UEM: 0.6633, LEM: 0.4514, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4677, partial_loss/deprel_loss: 0.3887, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5624, loss: 0.5020, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  88%|########8 | 98/111 [01:07<00:08,  1.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9508, UAS: 0.9631, LAS: 0.9310, UEM: 0.6651, LEM: 0.4536, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1180, partial_loss/deprel_loss: 0.2272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3632, loss: 0.5052, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  92%|#########1| 102/111 [01:09<00:05,  1.59it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9632, LAS: 0.9310, UEM: 0.6633, LEM: 0.4508, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1988, partial_loss/deprel_loss: 0.3010, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4385, loss: 0.5050, batch_reg_loss: 0.1579, reg_loss: 0.1580 ||:  96%|#########6| 107/111 [01:11<00:02,  1.74it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9630, LAS: 0.9308, UEM: 0.6586, LEM: 0.4462, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2975, partial_loss/deprel_loss: 0.2869, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4469, loss: 0.5058, batch_reg_loss: 0.1578, reg_loss: 0.1580 ||: 100%|##########| 111/111 [01:13<00:00,  1.51it/s]\n",
      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:53:46,006 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.287  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.297  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.158  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - UEM                      |     0.659  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - LAS                      |     0.931  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - loss                     |     0.506  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - LEM                      |     0.446  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - EM                       |     0.939  |       N/A\n",
      "2023-04-07 01:53:46,007 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:53:46,012 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:53:50,768 - INFO - combo.training.trainer - Epoch duration: 0:01:21.642784\n",
      "2023-04-07 01:53:50,768 - INFO - combo.training.trainer - Estimated training time remaining: 6:05:22\n",
      "2023-04-07 01:53:50,768 - INFO - allennlp.training.trainer - Epoch 134/399\n",
      "2023-04-07 01:53:50,768 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:53:50,769 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:53:50,776 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9287, UAS: 0.9718, LAS: 0.9412, UEM: 0.7633, LEM: 0.5488, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3156, partial_loss/deprel_loss: 0.3260, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4818, loss: 0.4079, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:   3%|2         | 3/111 [00:02<01:31,  1.18it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9428, UAS: 0.9762, LAS: 0.9468, UEM: 0.8419, LEM: 0.6702, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2195, partial_loss/deprel_loss: 0.2797, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4255, loss: 0.3891, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:   5%|5         | 6/111 [00:05<01:29,  1.17it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9733, LAS: 0.9431, UEM: 0.8027, LEM: 0.6205, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5134, partial_loss/deprel_loss: 0.4853, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6488, loss: 0.4243, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:   8%|8         | 9/111 [00:07<01:24,  1.21it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9493, UAS: 0.9699, LAS: 0.9392, UEM: 0.7601, LEM: 0.5743, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2198, partial_loss/deprel_loss: 0.2679, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4161, loss: 0.4574, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  11%|#         | 12/111 [00:09<01:19,  1.25it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9578, UAS: 0.9700, LAS: 0.9394, UEM: 0.7412, LEM: 0.5441, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1170, partial_loss/deprel_loss: 0.2407, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3738, loss: 0.4592, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  14%|#4        | 16/111 [00:12<01:13,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9270, UAS: 0.9695, LAS: 0.9389, UEM: 0.7309, LEM: 0.5301, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4520, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5364, loss: 0.4606, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  17%|#7        | 19/111 [00:14<01:09,  1.32it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9080, UAS: 0.9663, LAS: 0.9359, UEM: 0.7046, LEM: 0.5065, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7200, partial_loss/deprel_loss: 0.4309, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6465, loss: 0.4794, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  20%|#9        | 22/111 [00:16<01:06,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9653, LAS: 0.9347, UEM: 0.6950, LEM: 0.4916, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2095, partial_loss/deprel_loss: 0.3036, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4425, loss: 0.4847, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  23%|##3       | 26/111 [00:19<00:59,  1.43it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9269, UAS: 0.9653, LAS: 0.9347, UEM: 0.6830, LEM: 0.4757, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4296, partial_loss/deprel_loss: 0.4066, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5690, loss: 0.4861, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  26%|##6       | 29/111 [00:21<00:57,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9645, LAS: 0.9338, UEM: 0.6744, LEM: 0.4669, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8113, partial_loss/deprel_loss: 0.4967, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7174, loss: 0.4907, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  29%|##8       | 32/111 [00:23<00:54,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9429, UAS: 0.9649, LAS: 0.9343, UEM: 0.6683, LEM: 0.4565, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1948, partial_loss/deprel_loss: 0.3047, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4405, loss: 0.4874, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  32%|###2      | 36/111 [00:25<00:50,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9286, UAS: 0.9644, LAS: 0.9336, UEM: 0.6664, LEM: 0.4544, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3603, partial_loss/deprel_loss: 0.3563, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5148, loss: 0.4898, batch_reg_loss: 0.1578, reg_loss: 0.1578 ||:  35%|###5      | 39/111 [00:27<00:49,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9366, UAS: 0.9648, LAS: 0.9339, UEM: 0.6610, LEM: 0.4440, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3040, partial_loss/deprel_loss: 0.2915, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4517, loss: 0.4882, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  39%|###8      | 43/111 [00:30<00:44,  1.54it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9580, UAS: 0.9658, LAS: 0.9349, UEM: 0.6893, LEM: 0.4781, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0704, partial_loss/deprel_loss: 0.1725, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3098, loss: 0.4800, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  42%|####2     | 47/111 [00:33<00:43,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9155, UAS: 0.9647, LAS: 0.9337, UEM: 0.6763, LEM: 0.4668, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6020, partial_loss/deprel_loss: 0.4514, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6392, loss: 0.4875, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  45%|####5     | 50/111 [00:35<00:42,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9278, UAS: 0.9651, LAS: 0.9342, UEM: 0.6885, LEM: 0.4830, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3910, partial_loss/deprel_loss: 0.3737, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5349, loss: 0.4831, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  48%|####7     | 53/111 [00:37<00:41,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8906, UAS: 0.9645, LAS: 0.9335, UEM: 0.6874, LEM: 0.4803, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.8582, partial_loss/deprel_loss: 0.5299, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7533, loss: 0.4878, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  50%|#####     | 56/111 [00:39<00:39,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9377, UAS: 0.9646, LAS: 0.9337, UEM: 0.6868, LEM: 0.4777, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2436, partial_loss/deprel_loss: 0.3096, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4541, loss: 0.4881, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  53%|#####3    | 59/111 [00:41<00:36,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8732, UAS: 0.9632, LAS: 0.9320, UEM: 0.6767, LEM: 0.4680, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3082, partial_loss/deprel_loss: 0.5926, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8934, loss: 0.4992, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  57%|#####6    | 63/111 [00:44<00:32,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9249, UAS: 0.9628, LAS: 0.9318, UEM: 0.6657, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4753, partial_loss/deprel_loss: 0.3602, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5409, loss: 0.5014, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  60%|######    | 67/111 [00:46<00:29,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9629, LAS: 0.9317, UEM: 0.6634, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1659, partial_loss/deprel_loss: 0.2795, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4145, loss: 0.5002, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  64%|######3   | 71/111 [00:50<00:29,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9411, UAS: 0.9631, LAS: 0.9319, UEM: 0.6611, LEM: 0.4487, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2327, partial_loss/deprel_loss: 0.2979, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4425, loss: 0.4989, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  68%|######7   | 75/111 [00:52<00:24,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9127, UAS: 0.9624, LAS: 0.9312, UEM: 0.6529, LEM: 0.4410, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6647, partial_loss/deprel_loss: 0.3638, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5816, loss: 0.5027, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  71%|#######1  | 79/111 [00:55<00:21,  1.46it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9530, UAS: 0.9625, LAS: 0.9314, UEM: 0.6539, LEM: 0.4423, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1623, partial_loss/deprel_loss: 0.2136, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3610, loss: 0.5015, batch_reg_loss: 0.1577, reg_loss: 0.1578 ||:  74%|#######3  | 82/111 [00:57<00:20,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9600, UAS: 0.9631, LAS: 0.9319, UEM: 0.6668, LEM: 0.4563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0680, partial_loss/deprel_loss: 0.1759, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3119, loss: 0.4982, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  77%|#######7  | 86/111 [01:00<00:17,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9406, UAS: 0.9634, LAS: 0.9321, UEM: 0.6686, LEM: 0.4560, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1692, partial_loss/deprel_loss: 0.3149, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4434, loss: 0.4973, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  81%|########1 | 90/111 [01:02<00:13,  1.56it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9453, UAS: 0.9634, LAS: 0.9322, UEM: 0.6708, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1608, partial_loss/deprel_loss: 0.2269, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3713, loss: 0.4965, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  86%|########5 | 95/111 [01:04<00:09,  1.67it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9337, UAS: 0.9634, LAS: 0.9321, UEM: 0.6702, LEM: 0.4563, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3192, partial_loss/deprel_loss: 0.3119, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4710, loss: 0.4978, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  90%|######### | 100/111 [01:07<00:06,  1.81it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9284, UAS: 0.9633, LAS: 0.9318, UEM: 0.6683, LEM: 0.4531, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3566, partial_loss/deprel_loss: 0.3839, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5360, loss: 0.5001, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  94%|#########3| 104/111 [01:09<00:04,  1.72it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9434, UAS: 0.9633, LAS: 0.9319, UEM: 0.6666, LEM: 0.4517, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2006, partial_loss/deprel_loss: 0.2815, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4229, loss: 0.4998, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||:  97%|#########7| 108/111 [01:12<00:01,  1.69it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9425, UAS: 0.9632, LAS: 0.9319, UEM: 0.6637, LEM: 0.4491, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2409, partial_loss/deprel_loss: 0.2592, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4131, loss: 0.4991, batch_reg_loss: 0.1576, reg_loss: 0.1577 ||: 100%|##########| 111/111 [01:13<00:00,  1.50it/s]\n",
      "2023-04-07 01:55:07,230 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.259  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.241  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.158  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - UEM                      |     0.664  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - LAS                      |     0.932  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - loss                     |     0.499  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - LEM                      |     0.449  |       N/A\n",
      "2023-04-07 01:55:07,231 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |       N/A\n",
      "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |       N/A\n",
      "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |       N/A\n",
      "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - EM                       |     0.943  |       N/A\n",
      "2023-04-07 01:55:07,232 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:55:07,236 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:55:11,923 - INFO - combo.training.trainer - Epoch duration: 0:01:21.154867\n",
      "2023-04-07 01:55:11,924 - INFO - combo.training.trainer - Estimated training time remaining: 6:03:57\n",
      "2023-04-07 01:55:11,924 - INFO - allennlp.training.trainer - Epoch 135/399\n",
      "2023-04-07 01:55:11,924 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:55:11,925 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:55:11,933 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9438, UAS: 0.9691, LAS: 0.9380, UEM: 0.5843, LEM: 0.3390, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2373, partial_loss/deprel_loss: 0.3147, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4568, loss: 0.4858, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||:   4%|3         | 4/111 [00:02<01:06,  1.62it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9238, UAS: 0.9676, LAS: 0.9361, UEM: 0.6419, LEM: 0.3989, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4023, partial_loss/deprel_loss: 0.3518, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5195, loss: 0.4727, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||:   6%|6         | 7/111 [00:04<01:09,  1.49it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9230, UAS: 0.9674, LAS: 0.9363, UEM: 0.6454, LEM: 0.4098, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4563, partial_loss/deprel_loss: 0.3694, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5443, loss: 0.4696, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||:   9%|9         | 10/111 [00:07<01:10,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9138, UAS: 0.9644, LAS: 0.9332, UEM: 0.6007, LEM: 0.3720, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6226, partial_loss/deprel_loss: 0.4763, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6631, loss: 0.4970, batch_reg_loss: 0.1576, reg_loss: 0.1576 ||:  13%|#2        | 14/111 [00:09<01:04,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9207, UAS: 0.9651, LAS: 0.9338, UEM: 0.6030, LEM: 0.3691, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4544, partial_loss/deprel_loss: 0.4473, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6063, loss: 0.4959, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  15%|#5        | 17/111 [00:11<01:03,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9548, UAS: 0.9668, LAS: 0.9357, UEM: 0.6544, LEM: 0.4272, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1150, partial_loss/deprel_loss: 0.1990, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3397, loss: 0.4817, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  18%|#8        | 20/111 [00:13<01:03,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9213, UAS: 0.9659, LAS: 0.9352, UEM: 0.6471, LEM: 0.4242, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5934, partial_loss/deprel_loss: 0.4032, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5988, loss: 0.4846, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  21%|##        | 23/111 [00:16<01:03,  1.38it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9362, UAS: 0.9641, LAS: 0.9333, UEM: 0.6212, LEM: 0.3983, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3112, partial_loss/deprel_loss: 0.3003, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4600, loss: 0.4957, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  24%|##4       | 27/111 [00:18<00:59,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9384, UAS: 0.9648, LAS: 0.9337, UEM: 0.6407, LEM: 0.4168, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2263, partial_loss/deprel_loss: 0.3393, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4742, loss: 0.4937, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  27%|##7       | 30/111 [00:20<00:56,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9233, UAS: 0.9644, LAS: 0.9333, UEM: 0.6349, LEM: 0.4096, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3704, partial_loss/deprel_loss: 0.3750, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5316, loss: 0.4975, batch_reg_loss: 0.1575, reg_loss: 0.1576 ||:  30%|##9       | 33/111 [00:23<00:54,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9444, UAS: 0.9655, LAS: 0.9345, UEM: 0.6660, LEM: 0.4442, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1504, partial_loss/deprel_loss: 0.2351, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3756, loss: 0.4871, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  32%|###2      | 36/111 [00:26<01:04,  1.16it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9454, UAS: 0.9662, LAS: 0.9350, UEM: 0.6732, LEM: 0.4479, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1823, partial_loss/deprel_loss: 0.2917, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4273, loss: 0.4840, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  35%|###5      | 39/111 [00:28<00:58,  1.23it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9490, UAS: 0.9670, LAS: 0.9356, UEM: 0.6809, LEM: 0.4519, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1688, partial_loss/deprel_loss: 0.2671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4049, loss: 0.4804, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  38%|###7      | 42/111 [00:31<00:54,  1.27it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9457, UAS: 0.9672, LAS: 0.9359, UEM: 0.6859, LEM: 0.4582, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1178, partial_loss/deprel_loss: 0.2272, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3628, loss: 0.4778, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  41%|####      | 45/111 [00:33<00:50,  1.30it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9301, UAS: 0.9668, LAS: 0.9354, UEM: 0.6857, LEM: 0.4583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2961, partial_loss/deprel_loss: 0.3744, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5162, loss: 0.4803, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  43%|####3     | 48/111 [00:35<00:46,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9666, LAS: 0.9353, UEM: 0.6826, LEM: 0.4584, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3903, partial_loss/deprel_loss: 0.3601, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5236, loss: 0.4821, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  47%|####6     | 52/111 [00:37<00:42,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8952, UAS: 0.9658, LAS: 0.9346, UEM: 0.6777, LEM: 0.4554, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7723, partial_loss/deprel_loss: 0.4786, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6948, loss: 0.4863, batch_reg_loss: 0.1575, reg_loss: 0.1575 ||:  50%|####9     | 55/111 [00:39<00:39,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8946, UAS: 0.9643, LAS: 0.9332, UEM: 0.6707, LEM: 0.4501, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9087, partial_loss/deprel_loss: 0.4306, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6837, loss: 0.4946, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  52%|#####2    | 58/111 [00:42<00:38,  1.39it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9465, UAS: 0.9643, LAS: 0.9332, UEM: 0.6744, LEM: 0.4534, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1724, partial_loss/deprel_loss: 0.2206, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3684, loss: 0.4935, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  56%|#####5    | 62/111 [00:44<00:34,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8704, UAS: 0.9634, LAS: 0.9321, UEM: 0.6687, LEM: 0.4472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.2048, partial_loss/deprel_loss: 0.6180, partial_loss/cycle_loss: 0.0000, batch_loss: 0.8928, loss: 0.5009, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  59%|#####8    | 65/111 [00:46<00:32,  1.43it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8924, UAS: 0.9634, LAS: 0.9317, UEM: 0.6662, LEM: 0.4438, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7750, partial_loss/deprel_loss: 0.5395, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7440, loss: 0.5028, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  62%|######2   | 69/111 [00:49<00:27,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9365, UAS: 0.9630, LAS: 0.9314, UEM: 0.6552, LEM: 0.4332, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2282, partial_loss/deprel_loss: 0.3793, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5065, loss: 0.5066, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  67%|######6   | 74/111 [00:51<00:22,  1.64it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9381, UAS: 0.9623, LAS: 0.9308, UEM: 0.6477, LEM: 0.4274, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1806, partial_loss/deprel_loss: 0.2618, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4030, loss: 0.5100, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  70%|#######   | 78/111 [00:54<00:20,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9275, UAS: 0.9625, LAS: 0.9310, UEM: 0.6503, LEM: 0.4295, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2958, partial_loss/deprel_loss: 0.3772, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5183, loss: 0.5094, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  74%|#######3  | 82/111 [00:56<00:18,  1.60it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9623, LAS: 0.9308, UEM: 0.6431, LEM: 0.4219, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3598, partial_loss/deprel_loss: 0.3868, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5388, loss: 0.5104, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  77%|#######7  | 86/111 [00:59<00:15,  1.66it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9800, UAS: 0.9630, LAS: 0.9316, UEM: 0.6675, LEM: 0.4568, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0234, partial_loss/deprel_loss: 0.0818, partial_loss/cycle_loss: 0.0000, batch_loss: 0.2275, loss: 0.5049, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  81%|########1 | 90/111 [01:01<00:13,  1.56it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9119, UAS: 0.9625, LAS: 0.9312, UEM: 0.6606, LEM: 0.4513, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6511, partial_loss/deprel_loss: 0.4525, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6496, loss: 0.5073, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  86%|########5 | 95/111 [01:04<00:09,  1.68it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9345, UAS: 0.9624, LAS: 0.9311, UEM: 0.6529, LEM: 0.4436, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3028, partial_loss/deprel_loss: 0.3201, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4740, loss: 0.5081, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  90%|######### | 100/111 [01:06<00:06,  1.79it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9629, LAS: 0.9315, UEM: 0.6583, LEM: 0.4480, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3456, partial_loss/deprel_loss: 0.4009, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5472, loss: 0.5050, batch_reg_loss: 0.1574, reg_loss: 0.1575 ||:  95%|#########4| 105/111 [01:09<00:03,  1.90it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9260, UAS: 0.9632, LAS: 0.9317, UEM: 0.6619, LEM: 0.4502, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4365, partial_loss/deprel_loss: 0.4079, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5709, loss: 0.5032, batch_reg_loss: 0.1573, reg_loss: 0.1575 ||:  98%|#########8| 109/111 [01:11<00:01,  1.78it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9632, LAS: 0.9317, UEM: 0.6597, LEM: 0.4482, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4608, partial_loss/deprel_loss: 0.3829, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5558, loss: 0.5031, batch_reg_loss: 0.1573, reg_loss: 0.1575 ||: 100%|##########| 111/111 [01:13<00:00,  1.52it/s]\n",
      "2023-04-07 01:56:27,897 - INFO - allennlp.training.trainer - Validating\n",
      "  0%|          | 0/13 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8755, UAS: 0.9614, LAS: 0.9128, UEM: 0.7969, LEM: 0.5543, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.0105, partial_loss/deprel_loss: 34.5376, partial_loss/cycle_loss: 0.0000, batch_loss: 27.8322, loss: 19.9957, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  23%|##3       | 3/13 [00:02<00:09,  1.01it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8697, UAS: 0.9551, LAS: 0.9059, UEM: 0.7413, LEM: 0.4867, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 1.3425, partial_loss/deprel_loss: 44.6023, partial_loss/cycle_loss: 0.0000, batch_loss: 35.9504, loss: 23.2370, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  46%|####6     | 6/13 [00:05<00:06,  1.03it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8892, UAS: 0.9458, LAS: 0.8954, UEM: 0.6814, LEM: 0.4354, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7257, partial_loss/deprel_loss: 28.0299, partial_loss/cycle_loss: 0.0000, batch_loss: 22.5690, loss: 25.5143, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  62%|######1   | 8/13 [00:07<00:04,  1.00it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9219, UAS: 0.9509, LAS: 0.9015, UEM: 0.6917, LEM: 0.4261, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4239, partial_loss/deprel_loss: 24.7843, partial_loss/cycle_loss: 0.0000, batch_loss: 19.9122, loss: 23.2583, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||:  85%|########4 | 11/13 [00:10<00:01,  1.02it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8841, UAS: 0.9485, LAS: 0.8984, UEM: 0.6581, LEM: 0.3961, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9117, partial_loss/deprel_loss: 29.0845, partial_loss/cycle_loss: 0.0000, batch_loss: 23.4500, loss: 23.9880, batch_reg_loss: 0.0000, reg_loss: 0.0000 ||: 100%|##########| 13/13 [00:12<00:00,  1.03it/s]\n",
      "2023-04-07 01:56:40,528 - INFO - combo.training.tensorboard_writer -                              Training |  Validation\n",
      "2023-04-07 01:56:40,528 - INFO - combo.training.tensorboard_writer - ELEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:56:40,528 - INFO - combo.training.tensorboard_writer - XPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - UPOS_ACC                 |     0.000  |     0.000\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - partial_loss/cycle_loss  |     0.000  |     0.000\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - ELAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - patience                 |     1.000  |       N/A\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - SEMREL_ACC               |     0.000  |     0.000\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - EUEM                     |     0.000  |     0.000\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - partial_loss/deprel_loss |     0.383  |    29.085\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - partial_loss/head_loss   |     0.461  |     0.912\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - reg_loss                 |     0.157  |     0.000\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - UEM                      |     0.660  |     0.658\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - LAS                      |     0.932  |     0.898\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - loss                     |     0.503  |    23.988\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - gpu_0_memory_MB          |  2425.273  |       N/A\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - LEM                      |     0.448  |     0.396\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - LEMMA_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - EUAS                     |     0.000  |     0.000\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - UAS                      |     0.963  |     0.949\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - FEATS_ACC                |     0.000  |     0.000\n",
      "2023-04-07 01:56:40,529 - INFO - combo.training.tensorboard_writer - EM                       |     0.921  |     0.884\n",
      "2023-04-07 01:56:40,530 - INFO - combo.training.tensorboard_writer - worker_0_memory_MB       |  7070.324  |       N/A\n",
      "2023-04-07 01:56:40,533 - INFO - allennlp.training.checkpointer - Best validation performance so far. Copying weights to './allennlpru3hb8qq/best.th'.\n",
      "2023-04-07 01:56:44,748 - INFO - combo.training.trainer - Epoch duration: 0:01:32.824060\n",
      "2023-04-07 01:56:44,748 - INFO - combo.training.trainer - Estimated training time remaining: 6:02:55\n",
      "2023-04-07 01:56:44,749 - INFO - allennlp.training.trainer - Epoch 136/399\n",
      "2023-04-07 01:56:44,749 - INFO - allennlp.training.trainer - Worker 0 memory usage: 6.9G\n",
      "2023-04-07 01:56:44,750 - INFO - allennlp.training.trainer - GPU 0 memory usage: 2.4G\n",
      "2023-04-07 01:56:44,759 - INFO - allennlp.training.trainer - Training\n",
      "  0%|          | 0/111 [00:00<?, ?it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9446, UAS: 0.9701, LAS: 0.9398, UEM: 0.6759, LEM: 0.4194, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1820, partial_loss/deprel_loss: 0.2697, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4095, loss: 0.4615, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:   4%|3         | 4/111 [00:02<01:11,  1.49it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9214, UAS: 0.9697, LAS: 0.9401, UEM: 0.7084, LEM: 0.4874, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4933, partial_loss/deprel_loss: 0.3671, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5497, loss: 0.4480, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:   7%|7         | 8/111 [00:05<01:07,  1.52it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9413, UAS: 0.9687, LAS: 0.9379, UEM: 0.6801, LEM: 0.4486, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2307, partial_loss/deprel_loss: 0.3055, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4479, loss: 0.4613, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  10%|9         | 11/111 [00:07<01:06,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9474, UAS: 0.9682, LAS: 0.9380, UEM: 0.6869, LEM: 0.4659, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1802, partial_loss/deprel_loss: 0.2410, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3861, loss: 0.4555, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  14%|#3        | 15/111 [00:09<01:03,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9389, UAS: 0.9685, LAS: 0.9379, UEM: 0.6714, LEM: 0.4464, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2852, partial_loss/deprel_loss: 0.3214, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4714, loss: 0.4577, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  17%|#7        | 19/111 [00:12<01:01,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8933, UAS: 0.9658, LAS: 0.9350, UEM: 0.6613, LEM: 0.4399, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.9620, partial_loss/deprel_loss: 0.5151, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7618, loss: 0.4760, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  21%|##        | 23/111 [00:15<00:58,  1.51it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9211, UAS: 0.9653, LAS: 0.9344, UEM: 0.6476, LEM: 0.4248, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5369, partial_loss/deprel_loss: 0.3851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5727, loss: 0.4804, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  23%|##3       | 26/111 [00:17<00:57,  1.48it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9266, UAS: 0.9657, LAS: 0.9349, UEM: 0.6618, LEM: 0.4411, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4090, partial_loss/deprel_loss: 0.3663, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5321, loss: 0.4762, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  26%|##6       | 29/111 [00:19<00:57,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9505, UAS: 0.9647, LAS: 0.9336, UEM: 0.6680, LEM: 0.4505, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0720, partial_loss/deprel_loss: 0.2051, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3357, loss: 0.4839, batch_reg_loss: 0.1573, reg_loss: 0.1573 ||:  29%|##8       | 32/111 [00:21<00:57,  1.37it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9482, UAS: 0.9650, LAS: 0.9338, UEM: 0.6674, LEM: 0.4472, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1642, partial_loss/deprel_loss: 0.2539, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3932, loss: 0.4823, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  32%|###2      | 36/111 [00:24<00:54,  1.38it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9315, UAS: 0.9646, LAS: 0.9335, UEM: 0.6565, LEM: 0.4366, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4016, partial_loss/deprel_loss: 0.3892, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5489, loss: 0.4877, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  35%|###5      | 39/111 [00:26<00:51,  1.40it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9291, UAS: 0.9645, LAS: 0.9335, UEM: 0.6487, LEM: 0.4291, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4346, partial_loss/deprel_loss: 0.3860, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5530, loss: 0.4894, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  38%|###7      | 42/111 [00:28<00:48,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9616, UAS: 0.9646, LAS: 0.9337, UEM: 0.6573, LEM: 0.4420, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.0802, partial_loss/deprel_loss: 0.1775, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3153, loss: 0.4892, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  41%|####1     | 46/111 [00:31<00:45,  1.41it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9332, UAS: 0.9645, LAS: 0.9333, UEM: 0.6492, LEM: 0.4313, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2660, partial_loss/deprel_loss: 0.3857, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5190, loss: 0.4911, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  45%|####5     | 50/111 [00:34<00:41,  1.47it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9047, UAS: 0.9644, LAS: 0.9332, UEM: 0.6480, LEM: 0.4294, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.6622, partial_loss/deprel_loss: 0.4969, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6872, loss: 0.4916, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  49%|####8     | 54/111 [00:36<00:37,  1.50it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9378, UAS: 0.9653, LAS: 0.9342, UEM: 0.6665, LEM: 0.4463, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2271, partial_loss/deprel_loss: 0.3296, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4663, loss: 0.4853, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  52%|#####2    | 58/111 [00:38<00:33,  1.58it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9177, UAS: 0.9645, LAS: 0.9335, UEM: 0.6710, LEM: 0.4583, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5423, partial_loss/deprel_loss: 0.4684, partial_loss/cycle_loss: 0.0000, batch_loss: 0.6404, loss: 0.4904, batch_reg_loss: 0.1572, reg_loss: 0.1573 ||:  56%|#####5    | 62/111 [00:41<00:29,  1.68it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9290, UAS: 0.9643, LAS: 0.9335, UEM: 0.6663, LEM: 0.4535, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3827, partial_loss/deprel_loss: 0.3363, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5027, loss: 0.4911, batch_reg_loss: 0.1572, reg_loss: 0.1572 ||:  60%|######    | 67/111 [00:43<00:24,  1.83it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9306, UAS: 0.9639, LAS: 0.9331, UEM: 0.6543, LEM: 0.4413, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3624, partial_loss/deprel_loss: 0.3598, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5175, loss: 0.4936, batch_reg_loss: 0.1572, reg_loss: 0.1572 ||:  65%|######4   | 72/111 [00:45<00:20,  1.93it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9639, LAS: 0.9333, UEM: 0.6653, LEM: 0.4611, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4176, partial_loss/deprel_loss: 0.3589, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5278, loss: 0.4929, batch_reg_loss: 0.1572, reg_loss: 0.1572 ||:  68%|######8   | 76/111 [00:48<00:20,  1.75it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9470, UAS: 0.9643, LAS: 0.9336, UEM: 0.6732, LEM: 0.4684, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1612, partial_loss/deprel_loss: 0.2706, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4059, loss: 0.4902, batch_reg_loss: 0.1572, reg_loss: 0.1572 ||:  72%|#######2  | 80/111 [00:51<00:19,  1.55it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9409, UAS: 0.9637, LAS: 0.9332, UEM: 0.6708, LEM: 0.4675, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2048, partial_loss/deprel_loss: 0.2418, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3916, loss: 0.4919, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  76%|#######5  | 84/111 [00:54<00:18,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.8990, UAS: 0.9633, LAS: 0.9327, UEM: 0.6642, LEM: 0.4607, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.7137, partial_loss/deprel_loss: 0.5212, partial_loss/cycle_loss: 0.0000, batch_loss: 0.7168, loss: 0.4959, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  79%|#######9  | 88/111 [00:57<00:16,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9202, UAS: 0.9628, LAS: 0.9321, UEM: 0.6605, LEM: 0.4564, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.5023, partial_loss/deprel_loss: 0.4027, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5797, loss: 0.4999, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  82%|########1 | 91/111 [01:00<00:14,  1.35it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9361, UAS: 0.9626, LAS: 0.9319, UEM: 0.6593, LEM: 0.4546, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1783, partial_loss/deprel_loss: 0.2851, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4208, loss: 0.5013, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  85%|########4 | 94/111 [01:02<00:12,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9473, UAS: 0.9628, LAS: 0.9321, UEM: 0.6646, LEM: 0.4604, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.1742, partial_loss/deprel_loss: 0.2021, partial_loss/cycle_loss: 0.0000, batch_loss: 0.3536, loss: 0.4988, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  87%|########7 | 97/111 [01:04<00:10,  1.29it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9209, UAS: 0.9628, LAS: 0.9321, UEM: 0.6630, LEM: 0.4590, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.4777, partial_loss/deprel_loss: 0.3639, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5438, loss: 0.4990, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  90%|######### | 100/111 [01:06<00:08,  1.34it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9242, UAS: 0.9631, LAS: 0.9322, UEM: 0.6644, LEM: 0.4581, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3459, partial_loss/deprel_loss: 0.3799, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5302, loss: 0.4976, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  94%|#########3| 104/111 [01:09<00:04,  1.45it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9261, UAS: 0.9630, LAS: 0.9320, UEM: 0.6604, LEM: 0.4538, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.3434, partial_loss/deprel_loss: 0.3645, partial_loss/cycle_loss: 0.0000, batch_loss: 0.5174, loss: 0.4983, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||:  96%|#########6| 107/111 [01:11<00:02,  1.44it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9631, LAS: 0.9321, UEM: 0.6599, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2039, partial_loss/deprel_loss: 0.2603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4061, loss: 0.4970, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 100%|##########| 111/111 [01:14<00:00,  1.42it/s]\n",
      "UPOS_ACC: 0.0000, XPOS_ACC: 0.0000, SEMREL_ACC: 0.0000, LEMMA_ACC: 0.0000, FEATS_ACC: 0.0000, EM: 0.9386, UAS: 0.9631, LAS: 0.9321, UEM: 0.6599, LEM: 0.4515, EUAS: 0.0000, ELAS: 0.0000, EUEM: 0.0000, ELEM: 0.0000, partial_loss/head_loss: 0.2039, partial_loss/deprel_loss: 0.2603, partial_loss/cycle_loss: 0.0000, batch_loss: 0.4061, loss: 0.4970, batch_reg_loss: 0.1571, reg_loss: 0.1572 ||: 100%|##########| 111/111 [01:14<00:00,  1.50it/s]\n",
      "2023-04-07 01:58:01,554 - INFO - combo.training.trainer - Ran out of patience.  Stopping training.\n",
      "2023-04-07 01:58:01,554 - INFO - allennlp.training.checkpointer - loading best weights\n",
      "2023-04-07 01:58:02,804 - INFO - allennlp.common.util - Metrics: {\n",
      "  \"best_epoch\": 135,\n",
      "  \"peak_worker_0_memory_MB\": 7070.32421875,\n",
      "  \"peak_gpu_0_memory_MB\": 2425.27294921875,\n",
      "  \"training_duration\": \"3:06:53.221860\",\n",
      "  \"training_start_epoch\": 0,\n",
      "  \"training_epochs\": 135,\n",
      "  \"epoch\": 135,\n",
      "  \"training_UPOS_ACC\": 0.0,\n",
      "  \"training_XPOS_ACC\": 0.0,\n",
      "  \"training_SEMREL_ACC\": 0.0,\n",
      "  \"training_LEMMA_ACC\": 0.0,\n",
      "  \"training_FEATS_ACC\": 0.0,\n",
      "  \"training_EM\": 0.9211469292640686,\n",
      "  \"training_UAS\": 0.9631774675364263,\n",
      "  \"training_LAS\": 0.9317305657860291,\n",
      "  \"training_UEM\": 0.6596950631978689,\n",
      "  \"training_LEM\": 0.4481664116080032,\n",
      "  \"training_EUAS\": 0.0,\n",
      "  \"training_ELAS\": 0.0,\n",
      "  \"training_EUEM\": 0.0,\n",
      "  \"training_ELEM\": 0.0,\n",
      "  \"training_partial_loss/head_loss\": 0.4608195722103119,\n",
      "  \"training_partial_loss/deprel_loss\": 0.3828725218772888,\n",
      "  \"training_partial_loss/cycle_loss\": 0.0,\n",
      "  \"training_loss\": 0.5030799737653217,\n",
      "  \"training_reg_loss\": 0.15746027405734533,\n",
      "  \"training_worker_0_memory_MB\": 7070.32421875,\n",
      "  \"training_gpu_0_memory_MB\": 2425.27294921875,\n",
      "  \"training_patience\": 1,\n",
      "  \"validation_UPOS_ACC\": 0.0,\n",
      "  \"validation_XPOS_ACC\": 0.0,\n",
      "  \"validation_SEMREL_ACC\": 0.0,\n",
      "  \"validation_LEMMA_ACC\": 0.0,\n",
      "  \"validation_FEATS_ACC\": 0.0,\n",
      "  \"validation_EM\": 0.8841390609741211,\n",
      "  \"validation_UAS\": 0.948533243417221,\n",
      "  \"validation_LAS\": 0.898415228519756,\n",
      "  \"validation_UEM\": 0.6580882352941176,\n",
      "  \"validation_LEM\": 0.3961397058823529,\n",
      "  \"validation_EUAS\": 0.0,\n",
      "  \"validation_ELAS\": 0.0,\n",
      "  \"validation_EUEM\": 0.0,\n",
      "  \"validation_ELEM\": 0.0,\n",
      "  \"validation_partial_loss/head_loss\": 0.91168212890625,\n",
      "  \"validation_partial_loss/deprel_loss\": 29.084543228149414,\n",
      "  \"validation_partial_loss/cycle_loss\": 0.0,\n",
      "  \"validation_loss\": 23.987967637869026,\n",
      "  \"validation_reg_loss\": 0.0,\n",
      "  \"best_validation_UPOS_ACC\": 0.0,\n",
      "  \"best_validation_XPOS_ACC\": 0.0,\n",
      "  \"best_validation_SEMREL_ACC\": 0.0,\n",
      "  \"best_validation_LEMMA_ACC\": 0.0,\n",
      "  \"best_validation_FEATS_ACC\": 0.0,\n",
      "  \"best_validation_EM\": 0.8841390609741211,\n",
      "  \"best_validation_UAS\": 0.948533243417221,\n",
      "  \"best_validation_LAS\": 0.898415228519756,\n",
      "  \"best_validation_UEM\": 0.6580882352941176,\n",
      "  \"best_validation_LEM\": 0.3961397058823529,\n",
      "  \"best_validation_EUAS\": 0.0,\n",
      "  \"best_validation_ELAS\": 0.0,\n",
      "  \"best_validation_EUEM\": 0.0,\n",
      "  \"best_validation_ELEM\": 0.0,\n",
      "  \"best_validation_partial_loss/head_loss\": 0.91168212890625,\n",
      "  \"best_validation_partial_loss/deprel_loss\": 29.084543228149414,\n",
      "  \"best_validation_partial_loss/cycle_loss\": 0.0,\n",
      "  \"best_validation_loss\": 23.987967637869026,\n",
      "  \"best_validation_reg_loss\": 0.0\n",
      "}\n",
      "2023-04-07 01:58:02,805 - INFO - allennlp.models.archival - archiving weights and vocabulary to ./allennlpru3hb8qq/model.tar.gz\n",
      "2023-04-07 02:10:56,965 - INFO - combo.main - Training model stored in: ./allennlpru3hb8qq\n"
     ]
    }
   ],
   "source": [
    "! {COMBO} --mode train \\\n",
    "    --training_data_path connlu/pdbc-train.conllu \\\n",
    "    --validation_data_path connlu/pdbc-validation.conllu \\\n",
    "    --cuda_device 0 \\\n",
    "    --pretrained_transformer_name allegro/herbert-large-cased \\\n",
    "    --targets head,deprel \\\n",
    "    --serialization_dir ."
   ]
  },
  {
   "cell_type": "markdown",
   "id": "e2c0090a",
   "metadata": {},
   "source": [
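    "Before running the next cell, replace `allennlpru3hb8qq` in it with the name of the `allennlp...` directory that COMBO created for your run. The name is printed on the last line of the training log, after `Training model stored in:`."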
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "f630757b",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Promote the freshly trained COMBO output directory to model-pdbc/.\n",
    "# The old model-pdbc/ is removed only if the new directory actually exists,\n",
    "# so re-running this cell after the move cannot delete the trained model.\n",
    "# `rm -rf` also stays silent when model-pdbc/ does not exist yet (first run).\n",
    "! test -d allennlpru3hb8qq/ && rm -rf model-pdbc/ && mv allennlpru3hb8qq/ model-pdbc/"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "combo_python39",
   "language": "python",
   "name": "combo_python39"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.16"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}